{"id":"https://openalex.org/W2164738518","doi":"https://doi.org/10.1109/hpca.2008.4658647","title":"Uncovering hidden loop level parallelism in sequential applications","display_name":"Uncovering hidden loop level parallelism in sequential applications","publication_year":2008,"publication_date":"2008-02-01","ids":{"openalex":"https://openalex.org/W2164738518","doi":"https://doi.org/10.1109/hpca.2008.4658647","mag":"2164738518"},"language":"en","primary_location":{"id":"doi:10.1109/hpca.2008.4658647","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca.2008.4658647","pdf_url":null,"source":{"id":"https://openalex.org/S4210184388","display_name":"Proceedings - International Symposium on High-Performance Computer Architecture/Proceedings","issn_l":"1530-0897","issn":["1530-0897","2378-203X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 IEEE 14th International Symposium on High Performance Computer Architecture","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042859357","display_name":"Hongtao Zhong","orcid":"https://orcid.org/0000-0003-2527-4246"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Hongtao Zhong","raw_affiliation_strings":["Advanced Computer Architecture Laboratory, University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"Advanced Computer Architecture Laboratory, University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014835828","display_name":"Mojtaba Mehrara","orcid":null},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mojtaba Mehrara","raw_affiliation_strings":["Advanced Computer Architecture Laboratory, University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"Advanced Computer Architecture Laboratory, University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084753957","display_name":"Steve Lieberman","orcid":null},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Steve Lieberman","raw_affiliation_strings":["Advanced Computer Architecture Laboratory, University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"Advanced Computer Architecture Laboratory, University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002075773","display_name":"Scott Mahlke","orcid":"https://orcid.org/0000-0002-0438-0616"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Scott Mahlke","raw_affiliation_strings":["Advanced Computer Architecture Laboratory, University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"Advanced Computer Architecture Laboratory, University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5042859357"],"corresponding_institution_ids":["https://openalex.org/I27837315"],"apc_list":null,"apc_paid":null,"fwci":13.1711,"has_fulltext":false,"cited_by_count":103,"citation_normalized_percentile":{"value":0.98963852,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"290","last_page":"301"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8757061958312988},{"id":"https://openalex.org/keywords/speculative-multithreading","display_name":"Speculative multithreading","score":0.8118681311607361},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7637780904769897},{"id":"https://openalex.org/keywords/task-parallelism","display_name":"Task parallelism","score":0.7502812147140503},{"id":"https://openalex.org/keywords/instruction-level-parallelism","display_name":"Instruction-level parallelism","score":0.6705071330070496},{"id":"https://openalex.org/keywords/implicit-parallelism","display_name":"Implicit parallelism","score":0.6582362055778503},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.6502193808555603},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.5730408430099487},{"id":"https://openalex.org/keywords/serialization","display_name":"Serialization","score":0.5587025284767151},{"id":"https://openalex.org/keywords/programmer","display_name":"Programmer","score":0.5484477281570435},{"id":"https://openalex.org/keywords/data-parallelism","display_name":"Data parallelism","score":0.5341158509254456},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5224846005439758},{"id":"https://openalex.org/keywords/instruction-set","display_name":"Instruction set","score":0.5114496946334839},{"id":"https://openalex.org/keywords/automatic-parallelization","display_name":"Automatic parallelization","score":0.4871065616607666},{"id":"https://openalex.org/keywords/speculative-execution","display_name":"Speculative execution","score":0.45611804723739624},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.4421316385269165},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.3894862234592438},{"id":"https://openalex.org/keywords/multithreading","display_name":"Multithreading","score":0.37632986903190613},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.35359692573547363},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.300912082195282}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8757061958312988},{"id":"https://openalex.org/C15296174","wikidata":"https://www.wikidata.org/wiki/Q7575343","display_name":"Speculative multithreading","level":4,"score":0.8118681311607361},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7637780904769897},{"id":"https://openalex.org/C42992933","wikidata":"https://www.wikidata.org/wiki/Q691169","display_name":"Task parallelism","level":3,"score":0.7502812147140503},{"id":"https://openalex.org/C140763907","wikidata":"https://www.wikidata.org/wiki/Q2714055","display_name":"Instruction-level parallelism","level":3,"score":0.6705071330070496},{"id":"https://openalex.org/C3543717","wikidata":"https://www.wikidata.org/wiki/Q6007302","display_name":"Implicit parallelism","level":4,"score":0.6582362055778503},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.6502193808555603},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.5730408430099487},{"id":"https://openalex.org/C52723943","wikidata":"https://www.wikidata.org/wiki/Q1127410","display_name":"Serialization","level":2,"score":0.5587025284767151},{"id":"https://openalex.org/C2778514511","wikidata":"https://www.wikidata.org/wiki/Q1374194","display_name":"Programmer","level":2,"score":0.5484477281570435},{"id":"https://openalex.org/C61483411","wikidata":"https://www.wikidata.org/wiki/Q3124522","display_name":"Data parallelism","level":3,"score":0.5341158509254456},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5224846005439758},{"id":"https://openalex.org/C202491316","wikidata":"https://www.wikidata.org/wiki/Q272683","display_name":"Instruction set","level":2,"score":0.5114496946334839},{"id":"https://openalex.org/C164833996","wikidata":"https://www.wikidata.org/wiki/Q2323839","display_name":"Automatic parallelization","level":3,"score":0.4871065616607666},{"id":"https://openalex.org/C141331961","wikidata":"https://www.wikidata.org/wiki/Q2164465","display_name":"Speculative execution","level":2,"score":0.45611804723739624},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4421316385269165},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.3894862234592438},{"id":"https://openalex.org/C201410400","wikidata":"https://www.wikidata.org/wiki/Q1064412","display_name":"Multithreading","level":3,"score":0.37632986903190613},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.35359692573547363},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.300912082195282}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca.2008.4658647","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca.2008.4658647","pdf_url":null,"source":{"id":"https://openalex.org/S4210184388","display_name":"Proceedings - International Symposium on High-Performance Computer Architecture/Proceedings","issn_l":"1530-0897","issn":["1530-0897","2378-203X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 IEEE 14th International Symposium on High Performance Computer Architecture","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5899999737739563,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W12207660","https://openalex.org/W1494930385","https://openalex.org/W1498870995","https://openalex.org/W1500590019","https://openalex.org/W1507552563","https://openalex.org/W1542975293","https://openalex.org/W1958945689","https://openalex.org/W1974831646","https://openalex.org/W1980999196","https://openalex.org/W1982812416","https://openalex.org/W2010220656","https://openalex.org/W2024547254","https://openalex.org/W2026585559","https://openalex.org/W2029050247","https://openalex.org/W2037078217","https://openalex.org/W2037462607","https://openalex.org/W2100184706","https://openalex.org/W2108795365","https://openalex.org/W2109502721","https://openalex.org/W2110710544","https://openalex.org/W2116299797","https://openalex.org/W2117269195","https://openalex.org/W2117285153","https://openalex.org/W2122545654","https://openalex.org/W2125340270","https://openalex.org/W2136798749","https://openalex.org/W2136958529","https://openalex.org/W2143535196","https://openalex.org/W2148255965","https://openalex.org/W2148390433","https://openalex.org/W2149473197","https://openalex.org/W2150007533","https://openalex.org/W2150334562","https://openalex.org/W2151373640","https://openalex.org/W2155312437","https://openalex.org/W2155410188","https://openalex.org/W2162523628","https://openalex.org/W2163488221","https://openalex.org/W2296006986","https://openalex.org/W3149553891","https://openalex.org/W4229693072","https://openalex.org/W4241739990","https://openalex.org/W4244452576","https://openalex.org/W4246485703","https://openalex.org/W4249006057","https://openalex.org/W4252176599","https://openalex.org/W4253095404","https://openalex.org/W4254179222","https://openalex.org/W4256302135","https://openalex.org/W6629849406","https://openalex.org/W6632361503","https://openalex.org/W6826581013"],"related_works":["https://openalex.org/W2034886984","https://openalex.org/W2135470015","https://openalex.org/W2905048389","https://openalex.org/W3012114143","https://openalex.org/W4247496551","https://openalex.org/W1972872690","https://openalex.org/W2126220043","https://openalex.org/W1567437828","https://openalex.org/W2274823567","https://openalex.org/W2121420032"],"abstract_inverted_index":{"As":[0],"multicore":[1],"systems":[2],"become":[3],"the":[4,11,15,19,33,58,61,72,91,97,105,159,182,190,199],"dominant":[5],"mainstream":[6],"computing":[7],"technology,":[8],"one":[9],"of":[10,25,35,64,75,84,99,107,147,169,198,202,223],"most":[12],"difficult":[13,62],"challenges":[14],"industry":[16],"faces":[17],"is":[18,53,80,150,162],"software.":[20,78,101],"Applications":[21],"with":[22,32,45,208],"large":[23],"amounts":[24,146],"explicit":[26],"thread-level":[27,216],"parallelism":[28,138,149],"naturally":[29],"scale":[30],"performance":[31,126],"number":[34,168],"cores,":[36],"but":[37,90,155],"single-threaded":[38,77,140],"applications":[39],"realize":[40],"little":[41],"to":[42,50,123,188,212,231],"no":[43],"gains":[44],"additional":[46],"cores.":[47],"One":[48],"solution":[49],"this":[51,119,129],"problem":[52,106],"automatic":[54,85],"parallelization":[55,86,186],"that":[56,115,144,196],"frees":[57],"programmer":[59],"from":[60,181],"task":[63],"parallel":[65],"programming":[66],"and":[67,161,171,176,184],"offers":[68],"hope":[69],"for":[70,87],"handling":[71],"vast":[73],"amount":[74],"legacy":[76],"There":[79],"a":[81,166,221,226],"long":[82],"history":[83],"scientific":[88,185],"applications,":[89,154],"techniques":[92,210],"have":[93],"generally":[94],"failed":[95],"in":[96,139,152,220],"context":[98],"general-purpose":[100,153],"Thread-level":[102],"speculation":[103,217],"overcomes":[104],"memory":[108],"dependence":[109],"analysis":[110],"by":[111,165],"speculating":[112],"unlikely":[113],"dependences":[114],"serialize":[116],"execution.":[117],"However,":[118],"approach":[120],"has":[121],"lead":[122],"only":[124],"modest":[125],"gains.":[127],"In":[128],"paper,":[130],"we":[131],"take":[132],"another":[133],"look":[134],"at":[135],"exploiting":[136],"loop-level":[137,148],"applications.":[141],"We":[142,174],"show":[143,195],"substantial":[145],"available":[151],"it":[156],"lurks":[157],"beneath":[158],"surface":[160],"often":[163],"obfuscated":[164],"small":[167],"data":[170],"control":[172],"dependences.":[173],"adapt":[175],"extend":[177],"several":[178],"code":[179],"transformations":[180],"instruction-level":[183],"communities":[187],"uncover":[189],"hidden":[191],"parallelism.":[192],"Our":[193],"results":[194],"61%":[197],"dynamic":[200],"execution":[201],"studied":[203],"benchmarks":[204],"can":[205],"be":[206],"parallelized":[207],"our":[209],"compared":[211,230],"27%":[213],"using":[214],"traditional":[215],"techniques,":[218],"resulting":[219],"speedup":[222],"1.84":[224],"on":[225],"four":[227],"core":[228],"system":[229],"1.41":[232],"without":[233],"transformations.":[234]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":6},{"year":2014,"cited_by_count":13},{"year":2013,"cited_by_count":7},{"year":2012,"cited_by_count":21}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
