{"id":"https://openalex.org/W2989562079","doi":"https://doi.org/10.1109/tc.2020.2987314","title":"Stream Semantic Registers: A Lightweight RISC-V ISA Extension Achieving Full Compute Utilization in Single-Issue Cores","display_name":"Stream Semantic Registers: A Lightweight RISC-V ISA Extension Achieving Full Compute Utilization in Single-Issue Cores","publication_year":2020,"publication_date":"2020-04-15","ids":{"openalex":"https://openalex.org/W2989562079","doi":"https://doi.org/10.1109/tc.2020.2987314","mag":"2989562079"},"language":"en","primary_location":{"id":"doi:10.1109/tc.2020.2987314","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2020.2987314","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1911.08356","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024145677","display_name":"Fabian Schuiki","orcid":"https://orcid.org/0000-0002-9923-5031"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH 
Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Fabian Schuiki","raw_affiliation_strings":["Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland","ETH Z\u00fcrich"],"raw_orcid":"https://orcid.org/0000-0002-9923-5031","affiliations":[{"raw_affiliation_string":"Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland","institution_ids":[]},{"raw_affiliation_string":"ETH Z\u00fcrich","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058655278","display_name":"Florian Zaruba","orcid":"https://orcid.org/0000-0002-8194-6521"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Florian Zaruba","raw_affiliation_strings":["Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland","ETH Z\u00fcrich"],"raw_orcid":"https://orcid.org/0000-0002-8194-6521","affiliations":[{"raw_affiliation_string":"Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland","institution_ids":[]},{"raw_affiliation_string":"ETH Z\u00fcrich","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026990786","display_name":"Torsten Hoefler","orcid":"https://orcid.org/0000-0002-1333-9797"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH 
Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]},{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Torsten Hoefler","raw_affiliation_strings":["Scalable Parallel Computing Laboratory (SPCL), Swiss Federal Institute of Technology, Zurich, Switzerland","ETH Z\u00fcrich"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Scalable Parallel Computing Laboratory (SPCL), Swiss Federal Institute of Technology, Zurich, Switzerland","institution_ids":["https://openalex.org/I5124864"]},{"raw_affiliation_string":"ETH Z\u00fcrich","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043408422","display_name":"Luca Benini","orcid":"https://orcid.org/0000-0001-8068-3806"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]},{"id":"https://openalex.org/I9360294","display_name":"University of Bologna","ror":"https://ror.org/01111rn36","country_code":"IT","type":"education","lineage":["https://openalex.org/I9360294"]}],"countries":["CH","IT"],"is_corresponding":false,"raw_author_name":"Luca Benini","raw_affiliation_strings":["Department of Electrical, Electronic, and Information Engineering (DEI), University of Bologna, Bologna, Italy","Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland","ETH 
Z\u00fcrich"],"raw_orcid":"https://orcid.org/0000-0001-8068-3806","affiliations":[{"raw_affiliation_string":"Department of Electrical, Electronic, and Information Engineering (DEI), University of Bologna, Bologna, Italy","institution_ids":["https://openalex.org/I9360294"]},{"raw_affiliation_string":"Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland","institution_ids":[]},{"raw_affiliation_string":"ETH Z\u00fcrich","institution_ids":["https://openalex.org/I35440088"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4721,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.56557262,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"70","issue":"2","first_page":"212","last_page":"227"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage 
Technologies","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8449844121932983},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7537055015563965},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6277227997779846},{"id":"https://openalex.org/keywords/register-file","display_name":"Register file","score":0.5373033881187439},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.5128350853919983},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.50244140625},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.47910669445991516},{"id":"https://openalex.org/keywords/loop-tiling","display_name":"Loop tiling","score":0.4598276615142822},{"id":"https://openalex.org/keywords/instruction-set","display_name":"Instruction set","score":0.45230937004089355},{"id":"https://openalex.org/keywords/microarchitecture","display_name":"Microarchitecture","score":0.4199608564376831},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating 
system","score":0.3282047212123871},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.29880261421203613}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8449844121932983},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7537055015563965},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6277227997779846},{"id":"https://openalex.org/C117280010","wikidata":"https://www.wikidata.org/wiki/Q180944","display_name":"Register file","level":3,"score":0.5373033881187439},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.5128350853919983},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.50244140625},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.47910669445991516},{"id":"https://openalex.org/C11799548","wikidata":"https://www.wikidata.org/wiki/Q6675847","display_name":"Loop tiling","level":3,"score":0.4598276615142822},{"id":"https://openalex.org/C202491316","wikidata":"https://www.wikidata.org/wiki/Q272683","display_name":"Instruction set","level":2,"score":0.45230937004089355},{"id":"https://openalex.org/C107598950","wikidata":"https://www.wikidata.org/wiki/Q259864","display_name":"Microarchitecture","level":2,"score":0.4199608564376831},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating 
system","level":1,"score":0.3282047212123871},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.29880261421203613}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.1109/tc.2020.2987314","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2020.2987314","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1911.08356","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1911.08356","pdf_url":"https://arxiv.org/pdf/1911.08356","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:www.research-collection.ethz.ch:20.500.11850/450549","is_oa":true,"landing_page_url":"http://hdl.handle.net/20.500.11850/450549","pdf_url":null,"source":{"id":"https://openalex.org/S4306402302","display_name":"Repository for 
Publications and Research Data (ETH Zurich)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I35440088","host_organization_name":"ETH Zurich","host_organization_lineage":["https://openalex.org/I35440088"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Transactions on Computers, 70 (2)","raw_type":"info:eu-repo/semantics/acceptedVersion"},{"id":"doi:10.48550/arxiv.1911.08356","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1911.08356","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"doi:10.3929/ethz-b-000450549","is_oa":true,"landing_page_url":"https://doi.org/10.3929/ethz-b-000450549","pdf_url":null,"source":{"id":"https://openalex.org/S7407051236","display_name":"ETH Z\u00fcrich Research 
Collection","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"},{"id":"mag:2989562079","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":null}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1911.08356","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1911.08356","pdf_url":"https://arxiv.org/pdf/1911.08356","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.9100000262260437,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G1689260938","display_name":null,"funder_award_id":"732631 OPRECOMP","funder_id":"https://openalex.org/F4320332999","funder_display_name":"Horizon 2020 Framework Programme"}],"funders":[{"id":"https://openalex.org/F4320332999","display_name":"Horizon 2020 Framework 
Programme","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W127009360","https://openalex.org/W1518148158","https://openalex.org/W1555915743","https://openalex.org/W1571230620","https://openalex.org/W1871211636","https://openalex.org/W1879667491","https://openalex.org/W1956142535","https://openalex.org/W1970227175","https://openalex.org/W1988374166","https://openalex.org/W2003313945","https://openalex.org/W2011316624","https://openalex.org/W2034402701","https://openalex.org/W2058234234","https://openalex.org/W2078726412","https://openalex.org/W2127609451","https://openalex.org/W2131081741","https://openalex.org/W2153185479","https://openalex.org/W2159182073","https://openalex.org/W2282593638","https://openalex.org/W2345737886","https://openalex.org/W2761412899","https://openalex.org/W2763302904","https://openalex.org/W2845210056","https://openalex.org/W2902058806","https://openalex.org/W2936567838","https://openalex.org/W2945751418","https://openalex.org/W2947567876","https://openalex.org/W2953184160","https://openalex.org/W2963255460","https://openalex.org/W2963566954","https://openalex.org/W2963688890","https://openalex.org/W2994193159","https://openalex.org/W3004856113","https://openalex.org/W4246166885","https://openalex.org/W6670341109","https://openalex.org/W6733468875","https://openalex.org/W6761085593","https://openalex.org/W6987020231","https://openalex.org/W6999016131"],"related_works":["https://openalex.org/W2915415779","https://openalex.org/W3036126610","https://openalex.org/W2304177525","https://openalex.org/W2003402359","https://openalex.org/W1973875862","https://openalex.org/W2218720528","https://openalex.org/W2038679012","https://openalex.org/W2767149022","https://openalex.org/W2066023578","https://openalex.org/W2087619620","https://openalex.org/W2936814528","https://openalex.org/W2610229489","https://openalex.org/W2413117826","
https://openalex.org/W1530752073","https://openalex.org/W3159607817","https://openalex.org/W2025480814","https://openalex.org/W1988625252","https://openalex.org/W2372831926","https://openalex.org/W2127673258","https://openalex.org/W2164287667"],"abstract_inverted_index":{"Single-issue":[0],"processor":[1],"cores":[2,141],"are":[3,142],"very":[4],"energy":[5,60,164],"efficient":[6],"but":[7],"suffer":[8],"from":[9],"the":[10,22,86,90,99,149,198,202],"von":[11],"Neumann":[12],"bottleneck,":[13],"in":[14,89,126,144,159,167],"that":[15],"they":[16],"must":[17],"explicitly":[18],"fetch":[19],"and":[20,58,97,138,180],"issue":[21],"loads/stores":[23],"necessary":[24],"to":[25,45,55,113,147,155,161,178,187,195,201],"feed":[26],"their":[27],"ALU/FPU.":[28],"Each":[29],"instruction":[30,174,181],"spent":[31,39],"on":[32,40,48,134],"moving":[33],"data":[34],"is":[35,63],"a":[36,64,79,102,110,121,135,145,162,168],"cycle":[37],"not":[38],"computation,":[41],"limiting":[42],"ALU/FPU":[43],"utilization":[44,57,153],"33":[46],"percent":[47,124,158],"reductions.":[49],"We":[50,84],"propose":[51],"\u201cStream":[52],"Semantic":[53],"Registers\u201d":[54],"boost":[56],"increase":[59,125,154],"efficiency.":[61],"SSR":[62],"lightweight,":[65],"non-invasive":[66],"RISC-V":[67],"ISA":[68],"extension":[69,88,108,172],"which":[70],"implicitly":[71],"encodes":[72],"memory":[73],"accesses":[74],"as":[75],"register":[76],"reads/writes,":[77],"eliminating":[78],"large":[80],"number":[81],"of":[82,92],"loads/stores.":[83],"implement":[85],"proposed":[87],"RTL":[91],"an":[93],"existing":[94],"multi-core":[95,169],"cluster":[96,146],"synthesize":[98],"design":[100],"for":[101],"modern":[103],"22":[104],"nm":[105],"technology.":[106],"Our":[107],"provides":[109],"significant,":[111],"2x":[112,163],"5x,":[114],"architectural":[115],"speedup":[116],"across":[117],"different":[118],"kernels":[119],"at":[120],"small":[122],"11":[123],"core":[127],"area.":[128],"Sequential":[129],"code":[130],"runs":[13
1],"3x":[132,139],"faster":[133],"single":[136],"core,":[137],"fewer":[140],"needed":[143],"achieve":[148],"same":[150],"performance.":[151],"The":[152,171],"almost":[156],"100":[157],"leads":[160],"efficiency":[165],"improvement":[166],"cluster.":[170],"reduces":[173],"fetches":[175],"by":[176,185],"up":[177,186],"3.5x":[179],"cache":[182],"power":[183],"consumption":[184],"5.6x.":[188],"Compilers":[189],"can":[190],"automatically":[191],"map":[192],"loop":[193],"nests":[194],"SSRs,":[196],"making":[197],"changes":[199],"transparent":[200],"programmer.":[203]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
