{"id":"https://openalex.org/W2166282436","doi":"https://doi.org/10.1109/iccd.2007.4601890","title":"Cluster-level simultaneous multithreading for VLIW processors","display_name":"Cluster-level simultaneous multithreading for VLIW processors","publication_year":2007,"publication_date":"2007-10-01","ids":{"openalex":"https://openalex.org/W2166282436","doi":"https://doi.org/10.1109/iccd.2007.4601890","mag":"2166282436"},"language":"en","primary_location":{"id":"doi:10.1109/iccd.2007.4601890","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccd.2007.4601890","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2007 25th International Conference on Computer Design","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013381682","display_name":"Manoj Gupta","orcid":"https://orcid.org/0000-0002-4274-4927"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Manoj Gupta","raw_affiliation_strings":["Department of Computer Architecture, Universitat Politecnica de Catalunya, Spain"],"affiliations":[{"raw_affiliation_string":"Department of Computer Architecture, Universitat Politecnica de Catalunya, Spain","institution_ids":["https://openalex.org/I9617848"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039060971","display_name":"Ferm\u00edn S\u00e1nchez Carracedo","orcid":"https://orcid.org/0000-0001-6954-7643"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Fermin Sanchez","raw_affiliation_strings":["Department of Computer Architecture, Universitat Politecnica de Catalunya, Spain"],"affiliations":[{"raw_affiliation_string":"Department of Computer Architecture, Universitat Politecnica de Catalunya, Spain","institution_ids":["https://openalex.org/I9617848"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5013381682"],"corresponding_institution_ids":["https://openalex.org/I9617848"],"apc_list":null,"apc_paid":null,"fwci":1.5883,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.84967508,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"121","last_page":"128"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/very-long-instruction-word","display_name":"Very long instruction word","score":0.9031137228012085},{"id":"https://openalex.org/keywords/multithreading","display_name":"Multithreading","score":0.867810845375061},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8541121482849121},{"id":"https://openalex.org/keywords/simultaneous-multithreading","display_name":"Simultaneous multithreading","score":0.7834223508834839},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.7610064148902893},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.7557801008224487},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7448530197143555},{"id":"https://openalex.org/keywords/instruction-level-parallelism","display_name":"Instruction-level parallelism","score":0.6250054836273193},{"id":"https://openalex.org/keywords/instruction-set","display_name":"Instruction set","score":0.6224736571311951},{"id":"https://openalex.org/keywords/yarn","display_name":"Yarn","score":0.4305962324142456},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.2439800500869751},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.14387446641921997}],"concepts":[{"id":"https://openalex.org/C170595534","wikidata":"https://www.wikidata.org/wiki/Q249743","display_name":"Very long instruction word","level":2,"score":0.9031137228012085},{"id":"https://openalex.org/C201410400","wikidata":"https://www.wikidata.org/wiki/Q1064412","display_name":"Multithreading","level":3,"score":0.867810845375061},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8541121482849121},{"id":"https://openalex.org/C85717602","wikidata":"https://www.wikidata.org/wiki/Q82178","display_name":"Simultaneous multithreading","level":4,"score":0.7834223508834839},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.7610064148902893},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.7557801008224487},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7448530197143555},{"id":"https://openalex.org/C140763907","wikidata":"https://www.wikidata.org/wiki/Q2714055","display_name":"Instruction-level parallelism","level":3,"score":0.6250054836273193},{"id":"https://openalex.org/C202491316","wikidata":"https://www.wikidata.org/wiki/Q272683","display_name":"Instruction set","level":2,"score":0.6224736571311951},{"id":"https://openalex.org/C2778787235","wikidata":"https://www.wikidata.org/wiki/Q49007","display_name":"Yarn","level":2,"score":0.4305962324142456},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.2439800500869751},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.14387446641921997},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iccd.2007.4601890","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccd.2007.4601890","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2007 25th International Conference on Computer Design","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.599.7893","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.599.7893","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://mgupta.pc.ac.upc.edu/homepage/papers/iccd2007.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.41999998688697815,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W70437322","https://openalex.org/W1804655954","https://openalex.org/W2040167141","https://openalex.org/W2056497280","https://openalex.org/W2066670963","https://openalex.org/W2081040934","https://openalex.org/W2084451631","https://openalex.org/W2095950905","https://openalex.org/W2105555051","https://openalex.org/W2116903748","https://openalex.org/W2117285153","https://openalex.org/W2120230074","https://openalex.org/W2129962996","https://openalex.org/W2145303974","https://openalex.org/W2148051985","https://openalex.org/W2154055780","https://openalex.org/W2154348160","https://openalex.org/W2156007977","https://openalex.org/W2160401437","https://openalex.org/W2169229905","https://openalex.org/W2576288252","https://openalex.org/W3142147837","https://openalex.org/W3144732534","https://openalex.org/W3147835733","https://openalex.org/W4251803368","https://openalex.org/W4298376790","https://openalex.org/W6677504465","https://openalex.org/W6682005402","https://openalex.org/W6793159789"],"related_works":["https://openalex.org/W2224540060","https://openalex.org/W2107657843","https://openalex.org/W2161257244","https://openalex.org/W2128998116","https://openalex.org/W2105594083","https://openalex.org/W2166282436","https://openalex.org/W1897551170","https://openalex.org/W1580653297","https://openalex.org/W2133675875","https://openalex.org/W3187804951"],"abstract_inverted_index":{"Clustered":[0],"VLIW":[1,92,124,182],"embedded":[2],"processors":[3,93],"have":[4,35],"become":[5],"widespread":[6],"due":[7],"to":[8,84,122],"benefits":[9],"of":[10,23,88,104,177],"simple":[11,141],"hardware":[12,96],"and":[13,28,98,184,204],"low":[14],"power.":[15],"However,":[16,67],"while":[17],"some":[18,86,191],"applications":[19],"exhibit":[20],"large":[21],"amounts":[22],"instruction":[24,64,125],"level":[25,60],"parallelism":[26,61],"(ILP)":[27],"benefit":[29],"from":[30,126],"very":[31,140],"wide":[32,43],"machines,":[33],"others":[34],"little":[36],"ILP,":[37],"which":[38],"wastes":[39],"precious":[40],"resources":[41],"in":[42,90,109],"processors.":[44],"Simultaneous":[45],"multithreading":[46,162,188],"(SMT)":[47],"is":[48,147],"a":[49,110,123,127,139,180],"well":[50],"known":[51],"technique":[52],"that":[53,106,153],"improves":[54,156],"resource":[55],"utilization":[56],"by":[57],"exploiting":[58],"thread":[59,129,202],"at":[62],"the":[63,102,116],"grain":[65],"level.":[66],"implementing":[68],"SMT":[69,89],"for":[70,165],"VLIWs":[71],"requires":[72],"complex":[73],"structures.":[74],"In":[75,190],"this":[76],"paper,":[77],"we":[78],"propose":[79],"CSMT":[80,100,154,172],"(cluster-level":[81],"simultaneous":[82],"multithreading)":[83],"allow":[85],"degree":[87],"clustered":[91],"with":[94,160,169],"minimal":[95],"cost":[97],"complexity.":[99],"considers":[101],"set":[103],"operations":[105],"execute":[107],"simultaneously":[108],"given":[111,128],"cluster":[112,135,144],"(named":[113],"bundle)":[114],"as":[115,196,198],"assignment":[117],"unit.":[118],"All":[119],"bundles":[120],"belonging":[121],"are":[130],"issued":[131],"simultaneously.":[132],"To":[133],"minimize":[134],"conflicts":[136],"between":[137],"threads,":[138],"hardware-":[142],"based":[143],"renaming":[145],"mechanism":[146],"proposed.":[148],"The":[149],"experimental":[150],"results":[151],"show":[152],"significantly":[155],"ILP":[157],"when":[158],"compared":[159],"other":[161],"approaches":[163],"suited":[164],"VLIW.":[166],"For":[167],"instance,":[168],"4":[170],"threads":[171],"shows":[173],"an":[174],"average":[175],"speedup":[176,193],"113%":[178],"over":[179,186,200,206],"single-thread":[181],"architecture":[183,203],"36%":[185],"interleaved":[187],"(IMT).":[189],"cases,":[192],"can":[194],"be":[195],"high":[197],"228%":[199],"single":[201],"97%":[205],"IMT.":[207]},"counts_by_year":[{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
