{"id":"https://openalex.org/W2293274942","doi":"https://doi.org/10.1145/2892208.2892214","title":"Performance implications of transient loop-carried data dependences in automatically parallelized loops","display_name":"Performance implications of transient loop-carried data dependences in automatically parallelized loops","publication_year":2016,"publication_date":"2016-03-14","ids":{"openalex":"https://openalex.org/W2293274942","doi":"https://doi.org/10.1145/2892208.2892214","mag":"2293274942"},"language":"en","primary_location":{"id":"doi:10.1145/2892208.2892214","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2892208.2892214","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 25th International Conference on Compiler Construction","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.repository.cam.ac.uk/bitstreams/e368ecac-9567-41fd-8f4c-08ca0fe5bef6/download","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046803418","display_name":"Niall Murphy","orcid":"https://orcid.org/0000-0003-2559-3335"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Niall Murphy","raw_affiliation_strings":["University of Cambridge, UK"],"affiliations":[{"raw_affiliation_string":"University of Cambridge, UK","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047443783","display_name":"Timothy M. Jones","orcid":"https://orcid.org/0000-0002-4114-7661"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Timothy Jones","raw_affiliation_strings":["University of Cambridge, UK"],"affiliations":[{"raw_affiliation_string":"University of Cambridge, UK","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040762162","display_name":"Robert Mullins","orcid":"https://orcid.org/0000-0002-8393-2748"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Robert Mullins","raw_affiliation_strings":["University of Cambridge, UK"],"affiliations":[{"raw_affiliation_string":"University of Cambridge, UK","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084389543","display_name":"Simone Campanoni","orcid":"https://orcid.org/0000-0001-9806-7016"},"institutions":[{"id":"https://openalex.org/I111979921","display_name":"Northwestern University","ror":"https://ror.org/000e0be47","country_code":"US","type":"education","lineage":["https://openalex.org/I111979921"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Simone Campanoni","raw_affiliation_strings":["Northwestern University, USA"],"affiliations":[{"raw_affiliation_string":"Northwestern University, USA","institution_ids":["https://openalex.org/I111979921"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5046803418"],"corresponding_institution_ids":["https://openalex.org/I241749"],"apc_list":null,"apc_paid":null,"fwci":2.5683,"has_fulltext":true,"cited_by_count":18,"citation_normalized_percentile":{"value":0.8846786,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"23","last_page":"33"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8452029228210449},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.8371431827545166},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.7322331666946411},{"id":"https://openalex.org/keywords/speculative-multithreading","display_name":"Speculative multithreading","score":0.6503679156303406},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.5760587453842163},{"id":"https://openalex.org/keywords/speculative-execution","display_name":"Speculative execution","score":0.5478963851928711},{"id":"https://openalex.org/keywords/automatic-parallelization","display_name":"Automatic parallelization","score":0.49381527304649353},{"id":"https://openalex.org/keywords/interconnection","display_name":"Interconnection","score":0.4892539978027344},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.4666787385940552},{"id":"https://openalex.org/keywords/task-parallelism","display_name":"Task parallelism","score":0.461153507232666},{"id":"https://openalex.org/keywords/instruction-level-parallelism","display_name":"Instruction-level parallelism","score":0.45337364077568054},{"id":"https://openalex.org/keywords/loop-tiling","display_name":"Loop tiling","score":0.4293639361858368},{"id":"https://openalex.org/keywords/dependence-analysis","display_name":"Dependence analysis","score":0.421263724565506},{"id":"https://openalex.org/keywords/loop","display_name":"Loop (graph theory)","score":0.4210142493247986},{"id":"https://openalex.org/keywords/multithreading","display_name":"Multithreading","score":0.3848378658294678},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.3689146637916565},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.16666865348815918}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8452029228210449},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.8371431827545166},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.7322331666946411},{"id":"https://openalex.org/C15296174","wikidata":"https://www.wikidata.org/wiki/Q7575343","display_name":"Speculative multithreading","level":4,"score":0.6503679156303406},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.5760587453842163},{"id":"https://openalex.org/C141331961","wikidata":"https://www.wikidata.org/wiki/Q2164465","display_name":"Speculative execution","level":2,"score":0.5478963851928711},{"id":"https://openalex.org/C164833996","wikidata":"https://www.wikidata.org/wiki/Q2323839","display_name":"Automatic parallelization","level":3,"score":0.49381527304649353},{"id":"https://openalex.org/C123745756","wikidata":"https://www.wikidata.org/wiki/Q1665949","display_name":"Interconnection","level":2,"score":0.4892539978027344},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.4666787385940552},{"id":"https://openalex.org/C42992933","wikidata":"https://www.wikidata.org/wiki/Q691169","display_name":"Task parallelism","level":3,"score":0.461153507232666},{"id":"https://openalex.org/C140763907","wikidata":"https://www.wikidata.org/wiki/Q2714055","display_name":"Instruction-level parallelism","level":3,"score":0.45337364077568054},{"id":"https://openalex.org/C11799548","wikidata":"https://www.wikidata.org/wiki/Q6675847","display_name":"Loop tiling","level":3,"score":0.4293639361858368},{"id":"https://openalex.org/C27390822","wikidata":"https://www.wikidata.org/wiki/Q320724","display_name":"Dependence analysis","level":2,"score":0.421263724565506},{"id":"https://openalex.org/C184670325","wikidata":"https://www.wikidata.org/wiki/Q512604","display_name":"Loop (graph theory)","level":2,"score":0.4210142493247986},{"id":"https://openalex.org/C201410400","wikidata":"https://www.wikidata.org/wiki/Q1064412","display_name":"Multithreading","level":3,"score":0.3848378658294678},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.3689146637916565},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.16666865348815918},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2892208.2892214","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2892208.2892214","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 25th International Conference on Compiler Construction","raw_type":"proceedings-article"},{"id":"pmh:oai:www.repository.cam.ac.uk:1810/254463","is_oa":true,"landing_page_url":"https://www.repository.cam.ac.uk/handle/1810/254463","pdf_url":"https://www.repository.cam.ac.uk/bitstreams/e368ecac-9567-41fd-8f4c-08ca0fe5bef6/download","source":{"id":"https://openalex.org/S4306401777","display_name":"Apollo (University of Cambridge)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I241749","host_organization_name":"University of Cambridge","host_organization_lineage":["https://openalex.org/I241749"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":{"id":"pmh:oai:www.repository.cam.ac.uk:1810/254463","is_oa":true,"landing_page_url":"https://www.repository.cam.ac.uk/handle/1810/254463","pdf_url":"https://www.repository.cam.ac.uk/bitstreams/e368ecac-9567-41fd-8f4c-08ca0fe5bef6/download","source":{"id":"https://openalex.org/S4306401777","display_name":"Apollo (University of Cambridge)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I241749","host_organization_name":"University of Cambridge","host_organization_lineage":["https://openalex.org/I241749"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3661743248","display_name":null,"funder_award_id":"EP/K026399/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G5649999263","display_name":null,"funder_award_id":"EP/G033110/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G5787069064","display_name":null,"funder_award_id":"EP/K026399/1 & EP/G033110/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2293274942.pdf","grobid_xml":"https://content.openalex.org/works/W2293274942.grobid-xml"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W79448102","https://openalex.org/W1491178396","https://openalex.org/W1525663018","https://openalex.org/W1544629082","https://openalex.org/W1557543533","https://openalex.org/W1582004751","https://openalex.org/W1964354616","https://openalex.org/W1977838359","https://openalex.org/W1980385176","https://openalex.org/W1982812416","https://openalex.org/W1986913310","https://openalex.org/W1990008205","https://openalex.org/W1990919222","https://openalex.org/W1990941549","https://openalex.org/W2008313934","https://openalex.org/W2010204191","https://openalex.org/W2037462607","https://openalex.org/W2046699259","https://openalex.org/W2047738780","https://openalex.org/W2067354926","https://openalex.org/W2096053480","https://openalex.org/W2100430002","https://openalex.org/W2103642785","https://openalex.org/W2112495948","https://openalex.org/W2116170858","https://openalex.org/W2119393363","https://openalex.org/W2128249697","https://openalex.org/W2129192659","https://openalex.org/W2136798749","https://openalex.org/W2142074538","https://openalex.org/W2148709764","https://openalex.org/W2151307463","https://openalex.org/W2158308706","https://openalex.org/W2159811471","https://openalex.org/W2167089275","https://openalex.org/W2171546589","https://openalex.org/W2296006986","https://openalex.org/W2296218291","https://openalex.org/W2537115708","https://openalex.org/W2611703827","https://openalex.org/W2626821661","https://openalex.org/W6683909398"],"related_works":["https://openalex.org/W3196293061","https://openalex.org/W2034886984","https://openalex.org/W4387670486","https://openalex.org/W2969801138","https://openalex.org/W2269131302","https://openalex.org/W3012385591","https://openalex.org/W2004692581","https://openalex.org/W3000039653","https://openalex.org/W2897479034","https://openalex.org/W2146081545"],"abstract_inverted_index":{"Recent":[0],"approaches":[1,102],"to":[2,77,103],"automatic":[3],"parallelization":[4],"have":[5],"taken":[6],"advantage":[7,105],"of":[8,57,95,106,110,134,146],"the":[9,50,55,66,79,84,107,124,135,141,144],"low-latency":[10],"on-chip":[11],"interconnect":[12],"provided":[13],"in":[14,40],"modern":[15],"multicore":[16],"processors,":[17],"demonstrating":[18],"significant":[19,31,58],"speedups,":[20],"even":[21],"for":[22],"complex":[23],"workloads.":[24],"Although":[25],"these":[26,111],"techniques":[27],"can":[28],"already":[29],"extract":[30],"thread-level":[32,60,148],"parallelism":[33,61],"from":[34],"application":[35],"loops,":[36],"we":[37],"are":[38,88],"interested":[39],"quantifying":[41],"and":[42,137],"exploiting":[43],"any":[44],"additional":[45,80],"performance":[46,81],"that":[47,122],"remains":[48],"on":[49,91],"table.":[51],"This":[52],"paper":[53],"confirms":[54],"existence":[56],"extra":[59],"within":[62],"loops":[63],"parallelized":[64],"by":[65],"HELIX":[67],"compiler.":[68],"However,":[69],"improving":[70],"static":[71],"data":[72,112,126],"dependence":[73,127],"analysis":[74,128],"is":[75],"unable":[76],"reach":[78],"offered":[82],"because":[83],"existing":[85],"loop-carried":[86],"dependences":[87,113],"true":[89],"only":[90],"a":[92],"small":[93],"subset":[94],"loop":[96],"iterations.":[97],"We":[98],"therefore":[99],"develop":[100],"three":[101],"take":[104],"transient":[108],"nature":[109],"through":[114],"speculation,":[115],"via":[116],"transactional":[117],"memory":[118],"support.":[119],"Results":[120],"show":[121],"coupling":[123],"state-of-the-art":[125],"with":[129],"fine-grained":[130],"speculation":[131],"achieves":[132],"most":[133],"speedups":[136],"may":[138],"help":[139],"close":[140],"gap":[142],"towards":[143],"limit":[145],"HELIX-style":[147],"parallelism.":[149]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
