{"id":"https://openalex.org/W2058929932","doi":"https://doi.org/10.1145/2628071.2628093","title":"ILP and TLP in shared memory applications","display_name":"ILP and TLP in shared memory applications","publication_year":2014,"publication_date":"2014-08-21","ids":{"openalex":"https://openalex.org/W2058929932","doi":"https://doi.org/10.1145/2628071.2628093","mag":"2058929932"},"language":"en","primary_location":{"id":"doi:10.1145/2628071.2628093","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2628071.2628093","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd international conference on Parallel architectures and compilation","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056171369","display_name":"Ehsan Fatehi","orcid":null},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ehsan Fatehi","raw_affiliation_strings":["Texas A&amp;M, College Station, TX, USA","Electrical & Computer Engineering, Texas A&M University#TAB#"],"affiliations":[{"raw_affiliation_string":"Texas A&amp;M, College Station, TX, USA","institution_ids":["https://openalex.org/I91045830"]},{"raw_affiliation_string":"Electrical & Computer Engineering, Texas A&M University#TAB#","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082578661","display_name":"Paul V. Gratz","orcid":"https://orcid.org/0000-0001-7120-7189"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Paul Gratz","raw_affiliation_strings":["Texas A&amp;M, College Station, TX, USA","Electrical & Computer Engineering, Texas A&M University#TAB#"],"affiliations":[{"raw_affiliation_string":"Texas A&amp;M, College Station, TX, USA","institution_ids":["https://openalex.org/I91045830"]},{"raw_affiliation_string":"Electrical & Computer Engineering, Texas A&M University#TAB#","institution_ids":["https://openalex.org/I91045830"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5056171369"],"corresponding_institution_ids":["https://openalex.org/I91045830"],"apc_list":null,"apc_paid":null,"fwci":1.2259,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.79501508,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"113","last_page":"126"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8534286022186279},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.7423418164253235},{"id":"https://openalex.org/keywords/task-parallelism","display_name":"Task parallelism","score":0.6890342831611633},{"id":"https://openalex.org/keywords/instruction-level-parallelism","display_name":"Instruction-level parallelism","score":0.6648021936416626},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6541889309883118},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5927160978317261},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.5405155420303345},{"id":"https://openalex.org/keywords/parsec","display_name":"Parsec","score":0.5268591642379761},{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.5037114024162292},{"id":"https://openalex.org/keywords/multithreading","display_name":"Multithreading","score":0.47657108306884766},{"id":"https://openalex.org/keywords/branch-predictor","display_name":"Branch predictor","score":0.46780967712402344},{"id":"https://openalex.org/keywords/speculative-execution","display_name":"Speculative execution","score":0.46660467982292175},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.4487456679344177},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.4402434229850769},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1270405650138855}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8534286022186279},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.7423418164253235},{"id":"https://openalex.org/C42992933","wikidata":"https://www.wikidata.org/wiki/Q691169","display_name":"Task parallelism","level":3,"score":0.6890342831611633},{"id":"https://openalex.org/C140763907","wikidata":"https://www.wikidata.org/wiki/Q2714055","display_name":"Instruction-level parallelism","level":3,"score":0.6648021936416626},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6541889309883118},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5927160978317261},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.5405155420303345},{"id":"https://openalex.org/C44060867","wikidata":"https://www.wikidata.org/wiki/Q12129","display_name":"Parsec","level":3,"score":0.5268591642379761},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.5037114024162292},{"id":"https://openalex.org/C201410400","wikidata":"https://www.wikidata.org/wiki/Q1064412","display_name":"Multithreading","level":3,"score":0.47657108306884766},{"id":"https://openalex.org/C168522837","wikidata":"https://www.wikidata.org/wiki/Q679552","display_name":"Branch predictor","level":2,"score":0.46780967712402344},{"id":"https://openalex.org/C141331961","wikidata":"https://www.wikidata.org/wiki/Q2164465","display_name":"Speculative execution","level":2,"score":0.46660467982292175},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.4487456679344177},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.4402434229850769},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1270405650138855},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C150846664","wikidata":"https://www.wikidata.org/wiki/Q7602306","display_name":"Stars","level":2,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2628071.2628093","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2628071.2628093","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd international conference on Parallel architectures and compilation","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6447108510","display_name":null,"funder_award_id":"CCF-1320074","funder_id":"https://openalex.org/F4320337387","funder_display_name":"Division of Computing and Communication Foundations"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320337387","display_name":"Division of Computing and Communication Foundations","ror":"https://ror.org/01mng8331"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W1566481184","https://openalex.org/W1940012472","https://openalex.org/W1958945689","https://openalex.org/W1981663600","https://openalex.org/W2006312753","https://openalex.org/W2025516544","https://openalex.org/W2030680937","https://openalex.org/W2045729716","https://openalex.org/W2079942837","https://openalex.org/W2085598418","https://openalex.org/W2099661831","https://openalex.org/W2105876415","https://openalex.org/W2119393363","https://openalex.org/W2122489278","https://openalex.org/W2126702189","https://openalex.org/W2129192659","https://openalex.org/W2132729131","https://openalex.org/W2133877928","https://openalex.org/W2147657366","https://openalex.org/W2151290553","https://openalex.org/W2156126318","https://openalex.org/W2156619090","https://openalex.org/W2163681909","https://openalex.org/W2169875292","https://openalex.org/W3203992401","https://openalex.org/W4233559994","https://openalex.org/W4246842159","https://openalex.org/W4250378094","https://openalex.org/W6634118119"],"related_works":["https://openalex.org/W1595275176","https://openalex.org/W2408058673","https://openalex.org/W2113960387","https://openalex.org/W2005952754","https://openalex.org/W2135470015","https://openalex.org/W2515308961","https://openalex.org/W2039947876","https://openalex.org/W2045242644","https://openalex.org/W4251785457","https://openalex.org/W2137430026"],"abstract_inverted_index":{"With":[0],"the":[1,12,96,121,134,140,148,153,166,181,214,218],"breakdown":[2],"of":[3,14,38,48,57,66,81,100,124,136,142,156,184,198,216,223],"Dennard":[4],"scaling,":[5],"future":[6,31,49,127],"processor":[7],"designs":[8,21],"will":[9,262],"be":[10,33],"at":[11],"mercy":[13],"power":[15,82],"limits":[16],"as":[17],"Chip":[18],"Multi-Processor":[19],"(CMP)":[20],"scale":[22],"out":[23],"to":[24,43,53,71,77,195],"many-cores.":[25],"It":[26],"is":[27,51,69,147,204],"critical,":[28],"therefore,":[29],"that":[30,126,151,245],"CMPs":[32],"optimally":[34,264],"designed":[35],"in":[36,79],"terms":[37,80],"performance":[39,58,84,125],"efficiency":[40],"with":[41,75,161],"respect":[42,76],"power.":[44],"A":[45],"characterization":[46],"analysis":[47,65],"workloads":[50,68],"imperative":[52],"ensure":[54],"maximum":[55],"returns":[56],"per":[59],"Watt":[60],"consumed.":[61],"Hence,":[62],"a":[63,91,172,196,254],"detailed":[64],"emerging":[67,137],"necessary":[70],"understand":[72],"their":[73],"characteristics":[74],"hardware":[78],"and":[83,111,236],"tradeoffs.":[85],"In":[86],"this":[87],"paper,":[88],"we":[89,189,256],"conduct":[90],"limit":[92],"study":[93,117,150,160],"simultaneously":[94],"analyzing":[95],"two":[97,154],"dominant":[98],"forms":[99,155],"parallelism":[101,157],"exploited":[102],"by":[103],"modern":[104,162],"computer":[105],"architectures:":[106],"Instruction":[107],"Level":[108,113],"Parallelism":[109,114],"(ILP)":[110],"Thread":[112],"(TLP).":[115],"This":[116],"gives":[118],"insights":[119],"into":[120,158,220],"upper":[122],"bounds":[123],"architectures":[128],"can":[129],"achieve.":[130],"Furthermore":[131],"it":[132],"identifies":[133],"bottlenecks":[135],"workloads.":[138],"To":[139],"best":[141],"our":[143,145],"knowledge,":[144],"work":[146,263],"first":[149],"combines":[152],"one":[159,251],"applications.":[163,186],"We":[164,176,211],"evaluate":[165],"PARSEC":[167],"multithreaded":[168],"benchmark":[169],"suite":[170],"using":[171],"specialized":[173],"trace-driven":[174],"simulator.":[175],"make":[177],"several":[178],"contributions":[179],"describing":[180],"high-level":[182],"behavior":[183],"next-generation":[185],"For":[187],"example,":[188],"show":[190,213],"these":[191],"applications":[192],"contain":[193],"up":[194],"factor":[197],"929X":[199],"more":[200],"ILP":[201],"than":[202],"what":[203],"currently":[205],"being":[206],"extracted":[207],"from":[208,250],"real":[209],"machines.":[210],"then":[212],"effects":[215],"breaking":[217],"application":[219],"increasing":[221],"numbers":[222],"threads":[224],"(exploiting":[225],"TLP),":[226],"instruction":[227],"window":[228],"size,":[229],"realistic":[230,233],"branch":[231],"prediction,":[232],"memory":[234],"latency,":[235],"thread":[237],"dependencies":[238],"on":[239],"exploitable":[240],"ILP.":[241],"Our":[242],"examination":[243],"shows":[244],"theses":[246],"benchmarks":[247],"differed":[248],"vastly":[249],"another.":[252],"As":[253],"result,":[255],"expect":[257],"no":[258],"single,":[259],"homogeneous,":[260],"micro-architecture":[261],"for":[265,268],"all,":[266],"arguing":[267],"reconfigurable,":[269],"heterogeneous":[270],"designs.":[271]},"counts_by_year":[{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
