{"id":"https://openalex.org/W3013692244","doi":"https://doi.org/10.1109/tc.2020.3027900","title":"Snitch: A Tiny Pseudo Dual-Issue Processor for Area and Energy Efficient Execution of Floating-Point Intensive Workloads","display_name":"Snitch: A Tiny Pseudo Dual-Issue Processor for Area and Energy Efficient Execution of Floating-Point Intensive Workloads","publication_year":2020,"publication_date":"2020-10-07","ids":{"openalex":"https://openalex.org/W3013692244","doi":"https://doi.org/10.1109/tc.2020.3027900","mag":"3013692244"},"language":"en","primary_location":{"id":"doi:10.1109/tc.2020.3027900","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2020.3027900","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2002.10143","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058655278","display_name":"Florian Zaruba","orcid":"https://orcid.org/0000-0002-8194-6521"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Florian Zaruba","raw_affiliation_strings":["Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland"],"raw_orcid":"https://orcid.org/0000-0002-8194-6521","affiliations":[{"raw_affiliation_string":"Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024145677","display_name":"Fabian Schuiki","orcid":"https://orcid.org/0000-0002-9923-5031"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fabian Schuiki","raw_affiliation_strings":["Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland"],"raw_orcid":"https://orcid.org/0000-0002-9923-5031","affiliations":[{"raw_affiliation_string":"Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026990786","display_name":"Torsten Hoefler","orcid":"https://orcid.org/0000-0002-1333-9797"},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Torsten Hoefler","raw_affiliation_strings":["Scalable Parallel Computing Laboratory (SPCL), Swiss Federal Institute of Technology, Zurich, Switzerland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Scalable Parallel Computing Laboratory (SPCL), Swiss Federal Institute of Technology, Zurich, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043408422","display_name":"Luca Benini","orcid":"https://orcid.org/0000-0001-8068-3806"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luca Benini","raw_affiliation_strings":["Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland"],"raw_orcid":"https://orcid.org/0000-0001-8068-3806","affiliations":[{"raw_affiliation_string":"Integrated Systems Laboratory (IIS), Swiss Federal Institute of Technology, Zurich, Switzerland","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":8.4973,"has_fulltext":false,"cited_by_count":89,"citation_normalized_percentile":{"value":0.98267362,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"70","issue":"11","first_page":"1845","last_page":"1860"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8209357857704163},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6639872789382935},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.5317802429199219},{"id":"https://openalex.org/keywords/floating-point","display_name":"Floating point","score":0.5271584391593933},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.49279263615608215},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.484347939491272},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.4423273801803589},{"id":"https://openalex.org/keywords/control-flow","display_name":"Control flow","score":0.4371473491191864},{"id":"https://openalex.org/keywords/instruction-set","display_name":"Instruction set","score":0.4339959919452667},{"id":"https://openalex.org/keywords/register-file","display_name":"Register file","score":0.41385558247566223},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3777419626712799},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3327902555465698},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.3243313431739807},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2840229868888855},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1436665654182434}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8209357857704163},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6639872789382935},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5317802429199219},{"id":"https://openalex.org/C84211073","wikidata":"https://www.wikidata.org/wiki/Q117879","display_name":"Floating point","level":2,"score":0.5271584391593933},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.49279263615608215},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.484347939491272},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.4423273801803589},{"id":"https://openalex.org/C160191386","wikidata":"https://www.wikidata.org/wiki/Q868299","display_name":"Control flow","level":2,"score":0.4371473491191864},{"id":"https://openalex.org/C202491316","wikidata":"https://www.wikidata.org/wiki/Q272683","display_name":"Instruction set","level":2,"score":0.4339959919452667},{"id":"https://openalex.org/C117280010","wikidata":"https://www.wikidata.org/wiki/Q180944","display_name":"Register file","level":3,"score":0.41385558247566223},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3777419626712799},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3327902555465698},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3243313431739807},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2840229868888855},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1436665654182434},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tc.2020.3027900","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2020.3027900","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2002.10143","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2002.10143","pdf_url":"https://arxiv.org/pdf/2002.10143","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:cris.unibo.it:11585/869643","is_oa":false,"landing_page_url":"http://hdl.handle.net/11585/869643","pdf_url":null,"source":{"id":"https://openalex.org/S4306402579","display_name":"Archivio istituzionale della ricerca (Alma Mater Studiorum Universit\u00e0 di Bologna)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210117483","host_organization_name":"Istituto di Ematologia di Bologna","host_organization_lineage":["https://openalex.org/I4210117483"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2002.10143","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2002.10143","pdf_url":"https://arxiv.org/pdf/2002.10143","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.9100000262260437,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G5339339394","display_name":null,"funder_award_id":"732631","funder_id":"https://openalex.org/F4320332999","funder_display_name":"Horizon 2020 Framework Programme"}],"funders":[{"id":"https://openalex.org/F4320332999","display_name":"Horizon 2020 Framework Programme","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W1555915743","https://openalex.org/W1988374166","https://openalex.org/W2089899129","https://openalex.org/W2095858451","https://openalex.org/W2144481293","https://openalex.org/W2153331583","https://openalex.org/W2165384099","https://openalex.org/W2334795732","https://openalex.org/W2520759911","https://openalex.org/W2613264175","https://openalex.org/W2796649226","https://openalex.org/W2798482670","https://openalex.org/W2809679348","https://openalex.org/W2935480346","https://openalex.org/W2936567838","https://openalex.org/W2947567876","https://openalex.org/W2963255460","https://openalex.org/W2963566954","https://openalex.org/W2982497812","https://openalex.org/W2989562079","https://openalex.org/W2992291612","https://openalex.org/W2994193159","https://openalex.org/W3015851914","https://openalex.org/W3016309475","https://openalex.org/W3092000444","https://openalex.org/W3123542955","https://openalex.org/W4297778246","https://openalex.org/W6750448596","https://openalex.org/W6750694976","https://openalex.org/W6763190703","https://openalex.org/W6999016131"],"related_works":["https://openalex.org/W2771613338","https://openalex.org/W4239584669","https://openalex.org/W2188516702","https://openalex.org/W2045555750","https://openalex.org/W4250432526","https://openalex.org/W788524553","https://openalex.org/W2101536355","https://openalex.org/W2009783759","https://openalex.org/W2039538849","https://openalex.org/W4245282684"],"abstract_inverted_index":{"Data-parallel":[0],"applications,":[1],"such":[2],"as":[3,75,159],"data":[4],"analytics,":[5],"machine":[6],"learning,":[7],"and":[8,49,116,144,173,193,202,242,261],"scientific":[9],"computing,":[10],"are":[11,47],"placing":[12],"an":[13,58,246],"ever-growing":[14],"demand":[15],"on":[16,21,190,245,269],"floating-point":[17,99,119,146,172],"operations":[18],"per":[19],"second":[20],"emerging":[22],"systems.":[23],"With":[24],"increasing":[25],"integration":[26],"density,":[27],"the":[28,34,63,104,133,152,171,188,191,239],"quest":[29],"for":[30,197],"energy":[31,44,68,267],"efficiency":[32,69,268],"becomes":[33],"number":[35],"one":[36],"design":[37],"concern.":[38],"While":[39,109],"dedicated":[40],"accelerators":[41],"provide":[42],"high":[43,73,118],"efficiency,":[45],"they":[46],"over-specialized":[48],"hard":[50],"to":[51,53,84,102,106,154],"adjust":[52,103],"algorithmic":[54],"changes.":[55],"We":[56,236,253],"propose":[57],"architectural":[59],"concept":[60],"that":[61],"tackles":[62],"issues":[64],"of":[65,211],"achieving":[66,117,230],"extreme":[67],"while":[70],"still":[71],"maintaining":[72],"flexibility":[74],"a":[76,86,97,123,145,180,207,225,231,262],"general-purpose":[77],"compute":[78,105],"engine.":[79],"The":[80,167,214],"key":[81],"idea":[82],"is":[83],"pair":[85],"tiny":[87],"10kGE":[88],"(kilo":[89],"gate":[90],"equivalent)":[91],"control":[92,107],"core,":[93],"called":[94],"Snitch,":[95,126],"with":[96,125,135],"double-precision":[98],"unit":[100,113],"(FPU)":[101,114],"ratio.":[108],"traditionally":[110],"minimizing":[111],"non-floating-point":[112],"area":[115],"utilization":[120],"has":[121],"been":[122],"trade-off,":[124],"we":[127],"achieve":[128,254],"them":[129],"both,":[130],"by":[131,176],"enhancing":[132],"ISA":[134,184,218,243],"two":[136,215],"minimally":[137],"intrusive":[138],"extensions:":[139],"stream":[140],"semantic":[141],"registers":[142],"(SSR)":[143],"repetition":[147],"instruction":[148],"(FREP).":[149],"SSRs":[150],"allow":[151],"core":[153,192,241],"implicitly":[155],"encode":[156],"load/store":[157],"instructions":[158,178],"register":[160],"reads/writes,":[161],"eliding":[162],"many":[163],"explicit":[164],"memory":[165],"instructions.":[166],"FREP":[168],"extension":[169],"decouples":[170],"integer":[174],"pipeline":[175],"sequencing":[177],"from":[179],"micro-loop":[181],"buffer.":[182],"These":[183],"extensions":[185,219,244],"significantly":[186],"reduce":[187],"pressure":[189],"free":[194],"it":[195],"up":[196],"other":[198],"tasks,":[199],"making":[200],"Snitch":[201,221],"FPU":[203],"effectively":[204],"dual-issue":[205],"at":[206],"minimal":[208],"incremental":[209],"cost":[210],"3.2":[212],"percent.":[213],"low":[216],"overhead":[217],"make":[220],"more":[222,255],"flexible":[223],"than":[224,256],"contemporary":[226],"vector":[227],"processor":[228],"lane,":[229],"<inline-formula><tex-math":[232,257,263],"notation=\"LaTeX\">$2\\times$</tex-math></inline-formula>":[233],"energy-efficiency":[234],"improvement.":[235],"have":[237],"evaluated":[238],"proposed":[240],"octa-core":[247],"cluster":[248],"in":[249,266],"22":[250],"nm":[251],"technology.":[252],"notation=\"LaTeX\">$6\\times$</tex-math></inline-formula>":[258],"multi-core":[259],"speed-up":[260],"notation=\"LaTeX\">$3.5\\times$</tex-math></inline-formula>":[264],"gain":[265],"several":[270],"parallel":[271],"microkernels.":[272]},"counts_by_year":[{"year":2026,"cited_by_count":8},{"year":2025,"cited_by_count":30},{"year":2024,"cited_by_count":15},{"year":2023,"cited_by_count":12},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":12},{"year":2020,"cited_by_count":6}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2020-04-03T00:00:00"}
