{"id":"https://openalex.org/W2100788418","doi":"https://doi.org/10.1145/2155620.2155654","title":"Complementing user-level coarse-grain parallelism with implicit speculative parallelism","display_name":"Complementing user-level coarse-grain parallelism with implicit speculative parallelism","publication_year":2011,"publication_date":"2011-12-03","ids":{"openalex":"https://openalex.org/W2100788418","doi":"https://doi.org/10.1145/2155620.2155654","mag":"2100788418"},"language":"en","primary_location":{"id":"doi:10.1145/2155620.2155654","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2155620.2155654","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 44th Annual IEEE/ACM International Symposium on Microarchitecture","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://era.ed.ac.uk/bitstream/1842/7900/2/Ioannou2012.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054351615","display_name":"Nikolas Ioannou","orcid":null},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Nikolas Ioannou","raw_affiliation_strings":["University of Edinburgh","Sch. of Informatics, Univ. of Edinburgh, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Edinburgh","institution_ids":["https://openalex.org/I98677209"]},{"raw_affiliation_string":"Sch. of Informatics, Univ. of Edinburgh, UK","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090902844","display_name":"Marcelo Cintra","orcid":null},"institutions":[{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]},{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Marcelo Cintra","raw_affiliation_strings":["Intel Labs","Sch. of Informatics, Univ. of Edinburgh, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intel Labs","institution_ids":["https://openalex.org/I1343180700"]},{"raw_affiliation_string":"Sch. of Informatics, Univ. of Edinburgh, UK","institution_ids":["https://openalex.org/I98677209"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.0305,"has_fulltext":true,"cited_by_count":10,"citation_normalized_percentile":{"value":0.78506996,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"284","last_page":"295"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8437952995300293},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7205725908279419},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6948215961456299},{"id":"https://openalex.org/keywords/instruction-level-parallelism","display_name":"Instruction-level parallelism","score":0.6802522540092468},{"id":"https://openalex.org/keywords/implicit-parallelism","display_name":"Implicit parallelism","score":0.6742157936096191},{"id":"https://openalex.org/keywords/task-parallelism","display_name":"Task parallelism","score":0.6509933471679688},{"id":"https://openalex.org/keywords/posix-threads","display_name":"POSIX Threads","score":0.614946722984314},{"id":"https://openalex.org/keywords/speculative-multithreading","display_name":"Speculative multithreading","score":0.5828484296798706},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5781069993972778},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.543470025062561},{"id":"https://openalex.org/keywords/data-parallelism","display_name":"Data parallelism","score":0.485110878944397},{"id":"https://openalex.org/keywords/multithreading","display_name":"Multithreading","score":0.45133477449417114},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.4482640027999878},{"id":"https://openalex.org/keywords/speculative-execution","display_name":"Speculative execution","score":0.42552316188812256},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.4201989769935608},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1510104537010193}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8437952995300293},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7205725908279419},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6948215961456299},{"id":"https://openalex.org/C140763907","wikidata":"https://www.wikidata.org/wiki/Q2714055","display_name":"Instruction-level parallelism","level":3,"score":0.6802522540092468},{"id":"https://openalex.org/C3543717","wikidata":"https://www.wikidata.org/wiki/Q6007302","display_name":"Implicit parallelism","level":4,"score":0.6742157936096191},{"id":"https://openalex.org/C42992933","wikidata":"https://www.wikidata.org/wiki/Q691169","display_name":"Task parallelism","level":3,"score":0.6509933471679688},{"id":"https://openalex.org/C41138395","wikidata":"https://www.wikidata.org/wiki/Q928112","display_name":"POSIX Threads","level":3,"score":0.614946722984314},{"id":"https://openalex.org/C15296174","wikidata":"https://www.wikidata.org/wiki/Q7575343","display_name":"Speculative multithreading","level":4,"score":0.5828484296798706},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5781069993972778},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.543470025062561},{"id":"https://openalex.org/C61483411","wikidata":"https://www.wikidata.org/wiki/Q3124522","display_name":"Data parallelism","level":3,"score":0.485110878944397},{"id":"https://openalex.org/C201410400","wikidata":"https://www.wikidata.org/wiki/Q1064412","display_name":"Multithreading","level":3,"score":0.45133477449417114},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.4482640027999878},{"id":"https://openalex.org/C141331961","wikidata":"https://www.wikidata.org/wiki/Q2164465","display_name":"Speculative execution","level":2,"score":0.42552316188812256},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.4201989769935608},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1510104537010193},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1145/2155620.2155654","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2155620.2155654","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 44th Annual IEEE/ACM International Symposium on Microarchitecture","raw_type":"proceedings-article"},{"id":"pmh:oai:era.ed.ac.uk:1842/7900","is_oa":true,"landing_page_url":"http://hdl.handle.net/1842/7900","pdf_url":"https://era.ed.ac.uk/bitstream/1842/7900/2/Ioannou2012.pdf","source":{"id":"https://openalex.org/S7407055182","display_name":"ERA","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"PhD Doctor of Philosophy"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.908.5752","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.908.5752","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://researcher.ibm.com/researcher/files/zurich-NIO/micro11_slides.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.913.6180","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.913.6180","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://researcher.watson.ibm.com/researcher/files/zurich-NIO/micro11.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.928.1339","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.928.1339","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://homepages.inf.ed.ac.uk/mc/Publications/micro11.pdf","raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:era.ed.ac.uk:1842/7900","is_oa":true,"landing_page_url":"http://hdl.handle.net/1842/7900","pdf_url":"https://era.ed.ac.uk/bitstream/1842/7900/2/Ioannou2012.pdf","source":{"id":"https://openalex.org/S7407055182","display_name":"ERA","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"PhD Doctor of Philosophy"},"sustainable_development_goals":[{"score":0.9100000262260437,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G1189752554","display_name":"Machine Learning for Thread Level Speculation on Multicore Architectures","funder_award_id":"EP/G000697/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G6256893149","display_name":null,"funder_award_id":"HiPEAC IST-004408","funder_id":"https://openalex.org/F4320334962","funder_display_name":"Sixth Framework Programme"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"},{"id":"https://openalex.org/F4320334962","display_name":"Sixth Framework Programme","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2100788418.pdf","grobid_xml":"https://content.openalex.org/works/W2100788418.grobid-xml"},"referenced_works_count":109,"referenced_works":["https://openalex.org/W75086091","https://openalex.org/W1481234801","https://openalex.org/W1525227808","https://openalex.org/W1551889632","https://openalex.org/W1579674405","https://openalex.org/W1589943916","https://openalex.org/W1600369258","https://openalex.org/W1916709771","https://openalex.org/W1958945689","https://openalex.org/W1963560066","https://openalex.org/W1968409088","https://openalex.org/W1973923004","https://openalex.org/W1974420955","https://openalex.org/W1974831646","https://openalex.org/W1979566015","https://openalex.org/W1983545421","https://openalex.org/W1986926028","https://openalex.org/W1987232633","https://openalex.org/W1987304299","https://openalex.org/W1988888548","https://openalex.org/W1990846311","https://openalex.org/W1999625132","https://openalex.org/W2001738739","https://openalex.org/W2002549773","https://openalex.org/W2005646196","https://openalex.org/W2008451057","https://openalex.org/W2009470771","https://openalex.org/W2018069366","https://openalex.org/W2026585559","https://openalex.org/W2029171059","https://openalex.org/W2031136586","https://openalex.org/W2032136713","https://openalex.org/W2034295647","https://openalex.org/W2035720033","https://openalex.org/W2037462607","https://openalex.org/W2044062670","https://openalex.org/W2044231720","https://openalex.org/W2048608000","https://openalex.org/W2067699632","https://openalex.org/W2071130955","https://openalex.org/W2072448041","https://openalex.org/W2079942837","https://openalex.org/W2086551443","https://openalex.org/W2090408221","https://openalex.org/W2095703459","https://openalex.org/W2095942479","https://openalex.org/W2098228187","https://openalex.org/W2099089002","https://openalex.org/W2099661831","https://openalex.org/W2099709763","https://openalex.org/W2100932767","https://openalex.org/W2101431901","https://openalex.org/W2101587002","https://openalex.org/W2101903894","https://openalex.org/W2102727118","https://openalex.org/W2105772643","https://openalex.org/W2105864407","https://openalex.org/W2105876415","https://openalex.org/W2106018697","https://openalex.org/W2108730429","https://openalex.org/W2110399624","https://openalex.org/W2110710544","https://openalex.org/W2110723369","https://openalex.org/W2116175063","https://openalex.org/W2116460500","https://openalex.org/W2117299787","https://openalex.org/W2117648153","https://openalex.org/W2120518487","https://openalex.org/W2121118021","https://openalex.org/W2122545654","https://openalex.org/W2123437221","https://openalex.org/W2123608497","https://openalex.org/W2125340270","https://openalex.org/W2125445874","https://openalex.org/W2130392506","https://openalex.org/W2131867938","https://openalex.org/W2132366470","https://openalex.org/W2133393645","https://openalex.org/W2134782496","https://openalex.org/W2136674263","https://openalex.org/W2136798749","https://openalex.org/W2137953999","https://openalex.org/W2140460036","https://openalex.org/W2141242940","https://openalex.org/W2145021036","https://openalex.org/W2145252892","https://openalex.org/W2146921303","https://openalex.org/W2149075803","https://openalex.org/W2150871235","https://openalex.org/W2151290553","https://openalex.org/W2153904572","https://openalex.org/W2155119470","https://openalex.org/W2155410188","https://openalex.org/W2156126318","https://openalex.org/W2158599369","https://openalex.org/W2161036704","https://openalex.org/W2162847528","https://openalex.org/W2164579444","https://openalex.org/W2165606466","https://openalex.org/W2167556016","https://openalex.org/W2169875292","https://openalex.org/W2296006986","https://openalex.org/W2534849208","https://openalex.org/W2535431417","https://openalex.org/W2611087190","https://openalex.org/W3145483441","https://openalex.org/W4244034697","https://openalex.org/W4251549117","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W2135470015","https://openalex.org/W2905048389","https://openalex.org/W3012114143","https://openalex.org/W2005952754","https://openalex.org/W2090754905","https://openalex.org/W4247496551","https://openalex.org/W2100788418","https://openalex.org/W1972872690","https://openalex.org/W1567437828","https://openalex.org/W2274823567"],"abstract_inverted_index":{"Multi-core":[0],"and":[1,11,106,141,184,206,220,231,241,261],"many-core":[2,104,151],"systems":[3],"are":[4,12],"the":[5,18,60,128,131,137,172,181,190,211,237,257,269],"norm":[6],"in":[7,66,74,160],"contemporary":[8],"processor":[9],"technology":[10],"expected":[13,65],"to":[14,90,115,134,204,217,224,255],"remain":[15,72],"so":[16],"for":[17,93,149,180,189],"foreseeable":[19],"future.":[20],"Programs":[21],"using":[22,84],"parallel":[23,47],"programming":[24,41],"primitives":[25],"like":[26],"PThreads":[27],"or":[28,51,164],"OpenMP":[29],"often":[30,215],"exploit":[31,117],"coarse-grain":[32,112],"parallelism,":[33],"because":[34],"it":[35],"offers":[36],"a":[37,55,103,150,252],"good":[38],"trade-off":[39],"between":[40,239],"effort":[42,133],"versus":[43],"performance":[44,79,91,167,194,219],"gain.":[45],"Some":[46],"applications":[48,110],"show":[49,147],"limited":[50],"no":[52],"scaling":[53],"beyond":[54],"number":[56,62,258],"of":[57,63,153,162,171,259,268,273],"cores.":[58],"Given":[59],"abundant":[61],"cores":[64,70,85,155],"future":[67],"many-cores,":[68],"several":[69],"would":[71],"idle":[73],"such":[75,227],"cases":[76],"while":[77],"execution":[78],"stagnates.":[80],"This":[81,213],"paper":[82],"proposes":[83],"that":[86,108,201],"do":[87],"not":[88],"contribute":[89],"improvement":[92],"running":[94],"implicit":[95,118,157,242,262],"fine-grain":[96],"speculative":[97,119,125,158],"threads.":[98,274],"In":[99],"particular,":[100],"we":[101,250],"present":[102,251],"architecture":[105],"protocol":[107],"allow":[109],"with":[111,197],"explicit":[113,240,260],"parallelism":[114,120,126,159],"further":[116],"within":[121,266],"each":[122],"thread.":[123],"Implicit":[124],"frees":[127],"programmer":[129],"from":[130],"additional":[132],"explicitly":[135],"partition":[136],"work":[138],"into":[139],"finer":[140],"properly":[142],"synchronized":[143],"tasks.":[144],"Our":[145],"results":[146],"that,":[148],"comprising":[152],"128":[154],"supporting":[156],"clusters":[161],"2":[163],"4":[165],"cores,":[166],"improves":[168],"on":[169,178,187],"top":[170],"highest":[173],"scalability":[174],"point":[175],"by":[176,185],"41%":[177],"average":[179,188],"4-core":[182],"cluster":[183],"27%":[186],"2-core":[191],"cluster.":[192],"These":[193],"improvements":[195],"come":[196],"an":[198],"energy":[199,221],"consumption":[200],"is":[202],"close":[203],"--":[205,210],"sometimes":[207],"better":[208,218],"than":[209],"baseline.":[212],"approach":[214],"leads":[216],"efficiency":[222],"compared":[223],"existing":[225],"alternatives":[226],"as":[228,244],"Core":[229],"Fusion":[230],"Frequency":[232],"Boosting.":[233],"We":[234],"also":[235],"investigate":[236],"tradeoffs":[238],"threads":[243],"input":[245],"dataset":[246],"sizes":[247],"vary.":[248],"Finally,":[249],"dynamic":[253],"mechanism":[254],"choose":[256],"threads,":[263],"which":[264],"performs":[265],"6%":[267],"static":[270],"oracle":[271],"selection":[272]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
