{"id":"https://openalex.org/W2033139628","doi":"https://doi.org/10.1145/1854273.1854313","title":"Partitioning streaming parallelism for multi-cores","display_name":"Partitioning streaming parallelism for multi-cores","publication_year":2010,"publication_date":"2010-09-11","ids":{"openalex":"https://openalex.org/W2033139628","doi":"https://doi.org/10.1145/1854273.1854313","mag":"2033139628"},"language":"en","primary_location":{"id":"doi:10.1145/1854273.1854313","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1854273.1854313","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th international conference on Parallel architectures and compilation techniques","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100401045","display_name":"Zheng Wang","orcid":"https://orcid.org/0000-0001-6157-0662"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Zheng Wang","raw_affiliation_strings":["University of Edinburgh, Edinburgh, United Kingdom","Institute for Computing Systems Architecture, School of Informatics, The University of Edinburgh, UK"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh, Edinburgh, United Kingdom","institution_ids":["https://openalex.org/I98677209"]},{"raw_affiliation_string":"Institute for Computing Systems Architecture, School of Informatics, The University of Edinburgh, UK","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5027001025","display_name":"Michael O\u2019Boyle","orcid":"https://orcid.org/0000-0003-1619-5052"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Michael F.P. O'Boyle","raw_affiliation_strings":["University of Edinburgh, Edinburgh, United Kingdom","Institute for Computing Systems Architecture, School of Informatics, The University of Edinburgh, UK"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh, Edinburgh, United Kingdom","institution_ids":["https://openalex.org/I98677209"]},{"raw_affiliation_string":"Institute for Computing Systems Architecture, School of Informatics, The University of Edinburgh, UK","institution_ids":["https://openalex.org/I98677209"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100401045"],"corresponding_institution_ids":["https://openalex.org/I98677209"],"apc_list":null,"apc_paid":null,"fwci":6.0596,"has_fulltext":false,"cited_by_count":110,"citation_normalized_percentile":{"value":0.96690219,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"307","last_page":"318"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8995076417922974},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.775731086730957},{"id":"https://openalex.org/keywords/porting","display_name":"Porting","score":0.7206543684005737},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7091967463493347},{"id":"https://openalex.org/keywords/software-portability","display_name":"Software portability","score":0.70872962474823},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.6248570680618286},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5626276135444641},{"id":"https://openalex.org/keywords/data-parallelism","display_name":"Data parallelism","score":0.5550376772880554},{"id":"https://openalex.org/keywords/instruction-level-parallelism","display_name":"Instruction-level parallelism","score":0.5101462006568909},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.4843081533908844},{"id":"https://openalex.org/keywords/stream-processing","display_name":"Stream processing","score":0.47430041432380676},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.44492533802986145},{"id":"https://openalex.org/keywords/task-parallelism","display_name":"Task parallelism","score":0.4240502119064331},{"id":"https://openalex.org/keywords/very-long-instruction-word","display_name":"Very long instruction word","score":0.4132181406021118},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.32598012685775757},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.1903461515903473}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8995076417922974},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.775731086730957},{"id":"https://openalex.org/C106251023","wikidata":"https://www.wikidata.org/wiki/Q851989","display_name":"Porting","level":3,"score":0.7206543684005737},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7091967463493347},{"id":"https://openalex.org/C63000827","wikidata":"https://www.wikidata.org/wiki/Q3080428","display_name":"Software portability","level":2,"score":0.70872962474823},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.6248570680618286},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5626276135444641},{"id":"https://openalex.org/C61483411","wikidata":"https://www.wikidata.org/wiki/Q3124522","display_name":"Data parallelism","level":3,"score":0.5550376772880554},{"id":"https://openalex.org/C140763907","wikidata":"https://www.wikidata.org/wiki/Q2714055","display_name":"Instruction-level parallelism","level":3,"score":0.5101462006568909},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.4843081533908844},{"id":"https://openalex.org/C107027933","wikidata":"https://www.wikidata.org/wiki/Q2006448","display_name":"Stream processing","level":2,"score":0.47430041432380676},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.44492533802986145},{"id":"https://openalex.org/C42992933","wikidata":"https://www.wikidata.org/wiki/Q691169","display_name":"Task parallelism","level":3,"score":0.4240502119064331},{"id":"https://openalex.org/C170595534","wikidata":"https://www.wikidata.org/wiki/Q249743","display_name":"Very long instruction word","level":2,"score":0.4132181406021118},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.32598012685775757},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.1903461515903473},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1854273.1854313","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1854273.1854313","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th international conference on Parallel architectures and compilation techniques","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5978990263","display_name":null,"funder_award_id":"EP/G036136/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W1490760466","https://openalex.org/W1506806321","https://openalex.org/W1568192366","https://openalex.org/W1585610988","https://openalex.org/W1601795611","https://openalex.org/W1663973292","https://openalex.org/W1967846636","https://openalex.org/W1991495385","https://openalex.org/W1997806454","https://openalex.org/W2005082107","https://openalex.org/W2011601876","https://openalex.org/W2031775479","https://openalex.org/W2039417226","https://openalex.org/W2040466547","https://openalex.org/W2056579078","https://openalex.org/W2064757275","https://openalex.org/W2088899347","https://openalex.org/W2088921570","https://openalex.org/W2091158003","https://openalex.org/W2097717378","https://openalex.org/W2099459818","https://openalex.org/W2111171966","https://openalex.org/W2115852795","https://openalex.org/W2118937112","https://openalex.org/W2119537359","https://openalex.org/W2121696980","https://openalex.org/W2122080725","https://openalex.org/W2131958140","https://openalex.org/W2134260566","https://openalex.org/W2134408405","https://openalex.org/W2135342109","https://openalex.org/W2145406052","https://openalex.org/W2150476673","https://openalex.org/W2151406013","https://openalex.org/W2153456949","https://openalex.org/W2159456929","https://openalex.org/W2159560337","https://openalex.org/W2162539651","https://openalex.org/W2165100134","https://openalex.org/W2166536280","https://openalex.org/W2168175751","https://openalex.org/W2170058712","https://openalex.org/W2321248633","https://openalex.org/W4231589243","https://openalex.org/W4244494905","https://openalex.org/W6629451354","https://openalex.org/W6629510986","https://openalex.org/W7039202648"],"related_works":["https://openalex.org/W4240606930","https://openalex.org/W2526302199","https://openalex.org/W2003935582","https://openalex.org/W2950520577","https://openalex.org/W3007272028","https://openalex.org/W2040503315","https://openalex.org/W168408236","https://openalex.org/W2494130044","https://openalex.org/W2105992728","https://openalex.org/W1535590766"],"abstract_inverted_index":{"Stream":[0],"based":[1],"languages":[2],"are":[3,166],"a":[4,37,58,84,101,128,144,153,162],"popular":[5],"approach":[6,42,105,160],"to":[7,19,43,80,91,161,168],"expressing":[8],"parallelism":[9,18],"in":[10],"modern":[11],"applications.":[12],"The":[13],"efficient":[14],"mapping":[15],"of":[16,108,137,180],"streaming":[17,45,60],"multi-core":[20],"processors":[21],"is,":[22],"however,":[23],"highly":[24],"dependent":[25],"on":[26,126,151],"the":[27,53,68,73,109,132,138,173,178],"program":[28,74],"and":[29,39,82,95,116],"underlying":[30],"architecture.":[31],"We":[32,87,124],"address":[33],"this":[34,89],"by":[35,113],"developing":[36],"portable":[38],"automatic":[40],"compiler-based":[41],"partitioning":[44,135],"programs":[46],"using":[47,62],"machine":[48],"learning.":[49],"Our":[50],"technique":[51,90],"predicts":[52],"ideal":[54],"partition":[55],"structure":[56],"for":[57],"given":[59],"application":[61],"prior":[63],"knowledge":[64],"learned":[65],"off-line.":[66],"Using":[67],"predictor":[69],"we":[70,149,165],"rapidly":[71],"search":[72],"space":[75],"(without":[76],"executing":[77,117],"any":[78],"code)":[79],"generate":[81],"select":[83],"good":[85],"partition.":[86],"applied":[88],"standard":[92],"StreamIt":[93,139,174],"applications":[94],"compared":[96,142],"against":[97,143],"existing":[98],"approaches.":[99],"On":[100],"4-core":[102],"platform,":[103,164],"our":[104,159,181],"achieves":[106],"60%":[107],"best":[110],"performance":[111,155],"found":[112],"iteratively":[114],"compiling":[115],"over":[118,131,172],"3000":[119],"different":[120],"partitions":[121],"per":[122],"program.":[123],"obtain,":[125],"average,":[127,152],"1.90x":[129],"speedup":[130],"already":[133],"tuned":[134],"scheme":[136],"compiler.":[140],"When":[141],"state-of-the-art":[145],"analytical,":[146],"model-based":[147],"approach,":[148],"achieve,":[150],"1.77x":[154],"improvement.":[156],"By":[157],"porting":[158],"8-core":[163],"able":[167],"obtain":[169],"1.8x":[170],"improvement":[171],"default":[175],"scheme,":[176],"demonstrating":[177],"portability":[179],"approach.":[182]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":14},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":13},{"year":2017,"cited_by_count":17},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":7},{"year":2014,"cited_by_count":12},{"year":2013,"cited_by_count":13},{"year":2012,"cited_by_count":10}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
