{"id":"https://openalex.org/W2176686728","doi":"https://doi.org/10.1145/2809808","title":"On-the-Fly Pipeline Parallelism","display_name":"On-the-Fly Pipeline Parallelism","publication_year":2015,"publication_date":"2015-09-08","ids":{"openalex":"https://openalex.org/W2176686728","doi":"https://doi.org/10.1145/2809808","mag":"2176686728"},"language":"en","primary_location":{"id":"doi:10.1145/2809808","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2809808","pdf_url":null,"source":{"id":"https://openalex.org/S2483380313","display_name":"ACM Transactions on Parallel Computing","issn_l":"2329-4949","issn":["2329-4949","2329-4957"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Parallel Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083447315","display_name":"I-Ting Angelina Lee","orcid":"https://orcid.org/0000-0002-0687-5508"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"I-Ting Angelina Lee","raw_affiliation_strings":["MIT CSAIL"],"affiliations":[{"raw_affiliation_string":"MIT CSAIL","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027618658","display_name":"Charles E. Leiserson","orcid":"https://orcid.org/0000-0001-6386-5552"},"institutions":[{"id":"https://openalex.org/I4210110987","display_name":"IIT@MIT","ror":"https://ror.org/01wp8zh54","country_code":"US","type":"facility","lineage":["https://openalex.org/I30771326","https://openalex.org/I4210110987"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Charles E. Leiserson","raw_affiliation_strings":["MIT CSAIL, Cambridge, MA"],"affiliations":[{"raw_affiliation_string":"MIT CSAIL, Cambridge, MA","institution_ids":["https://openalex.org/I4210110987"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018454153","display_name":"Tao B. Schardl","orcid":null},"institutions":[{"id":"https://openalex.org/I4210110987","display_name":"IIT@MIT","ror":"https://ror.org/01wp8zh54","country_code":"US","type":"facility","lineage":["https://openalex.org/I30771326","https://openalex.org/I4210110987"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tao B. Schardl","raw_affiliation_strings":["MIT CSAIL, Cambridge, MA"],"affiliations":[{"raw_affiliation_string":"MIT CSAIL, Cambridge, MA","institution_ids":["https://openalex.org/I4210110987"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022565558","display_name":"Zhunping Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210110987","display_name":"IIT@MIT","ror":"https://ror.org/01wp8zh54","country_code":"US","type":"facility","lineage":["https://openalex.org/I30771326","https://openalex.org/I4210110987"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhunping Zhang","raw_affiliation_strings":["MIT CSAIL, Cambridge, MA"],"affiliations":[{"raw_affiliation_string":"MIT CSAIL, Cambridge, MA","institution_ids":["https://openalex.org/I4210110987"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039750618","display_name":"Jim Sukha","orcid":null},"institutions":[{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jim Sukha","raw_affiliation_strings":["Intel Corporation, Hudson, MA"],"affiliations":[{"raw_affiliation_string":"Intel Corporation, Hudson, MA","institution_ids":["https://openalex.org/I1343180700"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5083447315"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.6395,"has_fulltext":false,"cited_by_count":36,"citation_normalized_percentile":{"value":0.95070361,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"2","issue":"3","first_page":"1","last_page":"42"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8170408010482788},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7529681921005249},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.7078492045402527},{"id":"https://openalex.org/keywords/data-parallelism","display_name":"Data parallelism","score":0.6913569569587708},{"id":"https://openalex.org/keywords/task-parallelism","display_name":"Task parallelism","score":0.5229264497756958},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.5041118860244751},{"id":"https://openalex.org/keywords/implicit-parallelism","display_name":"Implicit parallelism","score":0.49530282616615295},{"id":"https://openalex.org/keywords/instruction-level-parallelism","display_name":"Instruction-level parallelism","score":0.47537532448768616},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09768697619438171}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8170408010482788},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7529681921005249},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.7078492045402527},{"id":"https://openalex.org/C61483411","wikidata":"https://www.wikidata.org/wiki/Q3124522","display_name":"Data parallelism","level":3,"score":0.6913569569587708},{"id":"https://openalex.org/C42992933","wikidata":"https://www.wikidata.org/wiki/Q691169","display_name":"Task parallelism","level":3,"score":0.5229264497756958},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.5041118860244751},{"id":"https://openalex.org/C3543717","wikidata":"https://www.wikidata.org/wiki/Q6007302","display_name":"Implicit parallelism","level":4,"score":0.49530282616615295},{"id":"https://openalex.org/C140763907","wikidata":"https://www.wikidata.org/wiki/Q2714055","display_name":"Instruction-level parallelism","level":3,"score":0.47537532448768616},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09768697619438171}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2809808","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2809808","pdf_url":null,"source":{"id":"https://openalex.org/S2483380313","display_name":"ACM Transactions on Parallel Computing","issn_l":"2329-4949","issn":["2329-4949","2329-4957"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Parallel Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3052461425","display_name":null,"funder_award_id":"11621","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4977964089","display_name":"CSR: Small: Using Thread-Local Memory Mapping to Support Memory Abstractions for Dynamic Multithreading","funder_award_id":"1017058","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4980078154","display_name":null,"funder_award_id":"CNS-1017058, CCF-1162148","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6081516088","display_name":"SHF:  AF:  Medium:  Collaborative Research:The Ponchoir Stencil Complier","funder_award_id":"1162148","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6894402473","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320311330","display_name":"COMSATS Institute of Information Technology","ror":"https://ror.org/00nqqvk19"},{"id":"https://openalex.org/F4320321133","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35"},{"id":"https://openalex.org/F4320335561","display_name":"Institute of Computing Technology, Chinese Academy of Sciences","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1491838213","https://openalex.org/W1507039213","https://openalex.org/W1545099940","https://openalex.org/W1931688030","https://openalex.org/W1967882079","https://openalex.org/W1971181882","https://openalex.org/W1982812416","https://openalex.org/W1984263429","https://openalex.org/W1995321227","https://openalex.org/W2006059438","https://openalex.org/W2009122662","https://openalex.org/W2015003898","https://openalex.org/W2016559894","https://openalex.org/W2034209740","https://openalex.org/W2034896142","https://openalex.org/W2044872254","https://openalex.org/W2072725684","https://openalex.org/W2090247159","https://openalex.org/W2098147619","https://openalex.org/W2100156365","https://openalex.org/W2104342377","https://openalex.org/W2105321788","https://openalex.org/W2112250971","https://openalex.org/W2123914565","https://openalex.org/W2128294826","https://openalex.org/W2135063076","https://openalex.org/W2140199336","https://openalex.org/W2143592587","https://openalex.org/W2145406052","https://openalex.org/W2147536281","https://openalex.org/W2151307463","https://openalex.org/W2157758640","https://openalex.org/W2165100134","https://openalex.org/W2167396549","https://openalex.org/W2169706611","https://openalex.org/W2169875292","https://openalex.org/W2171546589","https://openalex.org/W2987803397","https://openalex.org/W3138993548","https://openalex.org/W4232919122"],"related_works":["https://openalex.org/W2003935582","https://openalex.org/W1501159154","https://openalex.org/W2950520577","https://openalex.org/W74409296","https://openalex.org/W2105992728","https://openalex.org/W2468095077","https://openalex.org/W2494130044","https://openalex.org/W305742777","https://openalex.org/W1554644772","https://openalex.org/W1991844655"],"abstract_inverted_index":{"Pipeline":[0,45],"parallelism":[1,46,90,121,147,162,171,247,277],"organizes":[2],"a":[3,7,17,33,68,92,116,150,164,188,249,318],"parallel":[4],"program":[5,110],"as":[6,80,108,261],"linear":[8],"sequence":[9],"of":[10,16,63,104,125,283,320],"stages.":[11],"Each":[12],"stage":[13],"processes":[14],"elements":[15],"data":[18,23,137],"stream,":[19],"passing":[20],"each":[21],"processed":[22],"element":[24,35],"to":[25,127,131,135,172,278],"the":[26,37,102,105,109,123,155,182,204,270],"next":[27],"stage,":[28],"and":[29,57,133,148,169,195,264,308],"then":[30],"taking":[31],"on":[32,206,280,329],"new":[34],"before":[36],"subsequent":[38],"stages":[39,126],"have":[40,243,268],"necessarily":[41],"completed":[42],"their":[43],"processing.":[44,60],"is":[47],"used":[48],"especially":[49],"in":[50,66,209],"streaming":[51],"applications":[52],"that":[53,87,233,274,293,302],"perform":[54],"video,":[55],"audio,":[56],"digital":[58],"signal":[59],"Three":[61],"out":[62],"13":[64],"benchmarks":[65,273],"PARSEC,":[67],"popular":[69],"software":[70],"benchmark":[71],"suite":[72],"designed":[73],"for":[74,143,314],"shared-memory":[75],"multiprocessors,":[76],"can":[77],"be":[78,136,173,289],"expressed":[79],"pipeline":[81,89,99,106,120,146,161,168,189,246,276,297],"parallelism.":[82,298],"Whereas":[83],"most":[84],"concurrency":[85],"platforms":[86],"support":[88,294],"use":[91],"\u201cconstruct-and-run\u201d":[93],"approach,":[94],"this":[95],"article":[96],"investigates":[97],"\u201con-the-fly\u201d":[98],"parallelism,":[100,183],"where":[101],"structure":[103],"emerges":[107],"executes":[111,203],"rather":[112],"than":[113],"being":[114],"specified":[115],"priori":[117],".":[118],"On-the-fly":[119],"allows":[122],"number":[124],"vary":[128],"from":[129],"iteration":[130,132],"dependencies":[134],"dependent.":[138],"We":[139,242,267],"propose":[140],"simple":[141],"linguistics":[142],"specifying":[144],"on-the-fly":[145,245],"describe":[149],"provably":[151],"efficient":[152],"scheduling":[153],"algorithm,":[154,158],"P":[156,177,201,207,211,216,222,226],"iper":[157,178,202,227],"which":[159],"integrates":[160],"into":[163,248],"work-stealing":[165,251],"scheduler,":[166],"allowing":[167],"fork-join":[170],"arbitrarily":[174],"nested.":[175],"The":[176],"algorithm":[179],"automatically":[180],"throttles":[181],"precluding":[184],"\u201crunaway\u201d":[185],"pipelines.":[186],"Given":[187],"computation":[190,205],"with":[191,239],"T":[192,196,210,213,220],"1":[193,214],"work":[194],"\u221e":[197],"span":[198],"(critical-path":[199],"length),":[200],"processors":[208],"\u2264":[212],"/":[215],"+":[217],"O":[218],"(":[219],"\u221e+lg":[221],")":[223],"expected":[224],"time.":[225,241],"also":[228],"limits":[229],"stack":[230],"space,":[231],"ensuring":[232],"it":[234],"does":[235],"not":[236],"grow":[237],"unboundedly":[238],"running":[240,328],"incorporated":[244],"Cilk-based":[250],"runtime":[252],"system.":[253],"Our":[254],"prototype":[255],"Cilk-P":[256,303,316],"implementation":[257],"exploits":[258],"optimizations":[259],"such":[260],"\u201clazy":[262],"enabling\u201d":[263],"\u201cdependency":[265],"folding.\u201d":[266],"ported":[269],"three":[271],"PARSEC":[272],"exhibit":[275],"run":[279],"Cilk-P.":[281],"One":[282],"these,":[284],"x264":[285,312],",":[286,313],"cannot":[287],"readily":[288],"executed":[290],"by":[291],"systems":[292],"only":[295],"construct-and-run":[296],"Benchmark":[299],"results":[300],"indicate":[301],"has":[304],"low":[305],"serial":[306,325],"overhead":[307],"good":[309],"scalability.":[310],"On":[311],"example,":[315],"exhibits":[317],"speedup":[319],"13.87":[321],"over":[322],"its":[323],"respective":[324],"counterpart":[326],"when":[327],"16":[330],"processors.":[331]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":8},{"year":2017,"cited_by_count":6}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
