{"id":"https://openalex.org/W4230737732","doi":"https://doi.org/10.1109/micro.2016.7783752","title":"Chainsaw: Von-neumann accelerators to leverage fused instruction chains","display_name":"Chainsaw: Von-neumann accelerators to leverage fused instruction chains","publication_year":2016,"publication_date":"2016-10-01","ids":{"openalex":"https://openalex.org/W4230737732","doi":"https://doi.org/10.1109/micro.2016.7783752"},"language":"en","primary_location":{"id":"doi:10.1109/micro.2016.7783752","is_oa":false,"landing_page_url":"https://doi.org/10.1109/micro.2016.7783752","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 49th Annual IEEE/ACM International Symposium on Microarchitecture (MICRO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040436347","display_name":"Amirali Sharifian","orcid":null},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Amirali Sharifian","raw_affiliation_strings":["School of Computing Science, Simon Fraser University"],"affiliations":[{"raw_affiliation_string":"School of Computing Science, Simon Fraser University","institution_ids":["https://openalex.org/I18014758"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016747898","display_name":"Snehasish Kumar","orcid":null},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Snehasish Kumar","raw_affiliation_strings":["School of Computing Science, Simon Fraser University"],"affiliations":[{"raw_affiliation_string":"School of Computing Science, Simon Fraser University","institution_ids":["https://openalex.org/I18014758"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113856709","display_name":"Apala Guha","orcid":null},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Apala Guha","raw_affiliation_strings":["School of Computing Science, Simon Fraser University"],"affiliations":[{"raw_affiliation_string":"School of Computing Science, Simon Fraser University","institution_ids":["https://openalex.org/I18014758"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035046431","display_name":"Arrvindh Shriraman","orcid":"https://orcid.org/0000-0001-8466-5701"},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Arrvindh Shriraman","raw_affiliation_strings":["School of Computing Science, Simon Fraser University"],"affiliations":[{"raw_affiliation_string":"School of Computing Science, Simon Fraser University","institution_ids":["https://openalex.org/I18014758"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5040436347"],"corresponding_institution_ids":["https://openalex.org/I18014758"],"apc_list":null,"apc_paid":null,"fwci":1.44623318,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.85070885,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"33","issue":null,"first_page":"1","last_page":"14"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8400643467903137},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7686952352523804},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.7567025423049927},{"id":"https://openalex.org/keywords/microarchitecture","display_name":"Microarchitecture","score":0.6990726590156555},{"id":"https://openalex.org/keywords/very-long-instruction-word","display_name":"Very long instruction word","score":0.6788003444671631},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.6714884042739868},{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.6585155129432678},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6164222955703735},{"id":"https://openalex.org/keywords/von-neumann-architecture","display_name":"Von Neumann architecture","score":0.5993699431419373},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.47324854135513306},{"id":"https://openalex.org/keywords/code-generation","display_name":"Code generation","score":0.44914087653160095},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.44835859537124634},{"id":"https://openalex.org/keywords/instruction-scheduling","display_name":"Instruction scheduling","score":0.446916401386261},{"id":"https://openalex.org/keywords/operand","display_name":"Operand","score":0.43927374482154846},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.4265035390853882},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.4109760522842407},{"id":"https://openalex.org/keywords/register-file","display_name":"Register file","score":0.41031086444854736},{"id":"https://openalex.org/keywords/instruction-set","display_name":"Instruction set","score":0.36802300810813904},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.19198191165924072},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.18444624543190002},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.18406176567077637},{"id":"https://openalex.org/keywords/schedule","display_name":"Schedule","score":0.12751618027687073}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8400643467903137},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7686952352523804},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.7567025423049927},{"id":"https://openalex.org/C107598950","wikidata":"https://www.wikidata.org/wiki/Q259864","display_name":"Microarchitecture","level":2,"score":0.6990726590156555},{"id":"https://openalex.org/C170595534","wikidata":"https://www.wikidata.org/wiki/Q249743","display_name":"Very long instruction word","level":2,"score":0.6788003444671631},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.6714884042739868},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.6585155129432678},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6164222955703735},{"id":"https://openalex.org/C80469333","wikidata":"https://www.wikidata.org/wiki/Q189088","display_name":"Von Neumann architecture","level":2,"score":0.5993699431419373},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.47324854135513306},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.44914087653160095},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.44835859537124634},{"id":"https://openalex.org/C73564150","wikidata":"https://www.wikidata.org/wiki/Q11417093","display_name":"Instruction scheduling","level":5,"score":0.446916401386261},{"id":"https://openalex.org/C55526617","wikidata":"https://www.wikidata.org/wiki/Q719375","display_name":"Operand","level":2,"score":0.43927374482154846},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.4265035390853882},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4109760522842407},{"id":"https://openalex.org/C117280010","wikidata":"https://www.wikidata.org/wiki/Q180944","display_name":"Register file","level":3,"score":0.41031086444854736},{"id":"https://openalex.org/C202491316","wikidata":"https://www.wikidata.org/wiki/Q272683","display_name":"Instruction set","level":2,"score":0.36802300810813904},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.19198191165924072},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.18444624543190002},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.18406176567077637},{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.12751618027687073},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.0},{"id":"https://openalex.org/C107568181","wikidata":"https://www.wikidata.org/wiki/Q5319000","display_name":"Dynamic priority scheduling","level":3,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C119948110","wikidata":"https://www.wikidata.org/wiki/Q7858726","display_name":"Two-level scheduling","level":4,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/micro.2016.7783752","is_oa":false,"landing_page_url":"https://doi.org/10.1109/micro.2016.7783752","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 49th Annual IEEE/ACM International Symposium on Microarchitecture (MICRO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.8999999761581421}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W1484728941","https://openalex.org/W1964471912","https://openalex.org/W1968415593","https://openalex.org/W1969529818","https://openalex.org/W1969816685","https://openalex.org/W1970227175","https://openalex.org/W1975489482","https://openalex.org/W1985856855","https://openalex.org/W1988521690","https://openalex.org/W2000321331","https://openalex.org/W2013281054","https://openalex.org/W2022632182","https://openalex.org/W2035924020","https://openalex.org/W2093621020","https://openalex.org/W2101134669","https://openalex.org/W2101536355","https://openalex.org/W2111394443","https://openalex.org/W2112495948","https://openalex.org/W2116267755","https://openalex.org/W2122171990","https://openalex.org/W2130408605","https://openalex.org/W2130766965","https://openalex.org/W2134218813","https://openalex.org/W2134633067","https://openalex.org/W2150947797","https://openalex.org/W2164264749","https://openalex.org/W2167556016","https://openalex.org/W2170382128","https://openalex.org/W2171697422","https://openalex.org/W2205217824","https://openalex.org/W2239947352","https://openalex.org/W2319625707","https://openalex.org/W2544732887","https://openalex.org/W4231250608","https://openalex.org/W4234024706","https://openalex.org/W4236272793","https://openalex.org/W4236433846","https://openalex.org/W6647713351","https://openalex.org/W6675115123","https://openalex.org/W6679595550","https://openalex.org/W6813102376"],"related_works":["https://openalex.org/W2059502833","https://openalex.org/W89872709","https://openalex.org/W2581286023","https://openalex.org/W2502878968","https://openalex.org/W2387572761","https://openalex.org/W2054117411","https://openalex.org/W2049097986","https://openalex.org/W2357256492","https://openalex.org/W3022819336","https://openalex.org/W4248406484"],"abstract_inverted_index":{"A":[0],"central":[1],"tenet":[2],"behind":[3],"accelerators":[4,68],"is":[5,30,44,83,123,195,241],"to":[6,65,137,187,219,260],"partition":[7],"a":[8,41,56,97,157,196,227,238,261],"program":[9,222],"execution":[10,181],"into":[11,156],"regions":[12],"with":[13,72],"different":[14,138],"behavior":[15],"(e.g.,":[16,109],"SIMD,":[17],"Irregular,":[18],"Compute-Intensive)":[19],"and":[20,75,101,148,183,204,232,235],"then":[21,171],"use":[22],"behavior-specialized":[23],"architectures":[24],"[1]":[25],"for":[26,46],"each":[27],"region.":[28],"It":[29],"unclear":[31],"whether":[32],"the":[33,47,52,79,85,106,116,124,143,146,149,161,168,179,189,245,254],"gains":[34],"in":[35],"efficiency":[36],"arise":[37],"from":[38],"recognizing":[39],"that":[40,103,153,237],"simpler":[42],"microarchitecture":[43],"sufficient":[45],"acceleratable":[48],"code":[49],"region":[50],"or":[51,55],"actual":[53],"microarchitecture,":[54],"combination":[57],"of":[58,105,126,133,145,151,244,247],"both.":[59],"Many":[60],"proposals":[61],"[2],":[62],"[3]":[63],"seem":[64],"choose":[66],"dataflow-based":[67],"which":[69,128,167],"encounters":[70],"challenges":[71],"fabric":[73],"utilization":[74],"static":[76],"power":[77],"when":[78],"available":[80,89],"instruction":[81,118],"parallelism":[82,88],"below":[84],"peak":[86],"operation":[87],"[4].":[90],"In":[91],"this":[92],"paper,":[93],"we":[94],"develop,":[95],"Chainsaw,":[96],"Von-Neumann":[98],"based":[99],"accelerator":[100],"demonstrate":[102],"many":[104],"fundamental":[107],"overheads":[108],"fetch-decode)":[110],"can":[111,214],"be":[112,215],"amortized":[113],"by":[114,141,173,257],"adopting":[115],"appropriate":[117],"abstraction.":[119],"The":[120],"key":[121],"insight":[122],"notion":[125],"chains,":[127],"are":[129,154],"compiler":[130,230],"fused":[131,155],"sequences":[132],"instructions.":[134],"chains":[135,147],"adapt":[136],"acceleration":[139],"behaviors":[140],"varying":[142],"length":[144],"types":[150],"instructions":[152],"chain.":[158],"Chains":[159],"convey":[160],"producer-consumer":[162],"locality":[163],"between":[164,191],"dependent":[165,192],"instructions,":[166],"Chainsaw":[169,194,240],"architecture":[170,199],"captures":[172],"temporally":[174],"scheduling":[175],"such":[176],"operations":[177],"on":[178],"same":[180],"unit":[182],"uses":[184],"pipeline":[185,201],"registers":[186],"forward":[188],"values":[190],"operations.":[193],"generic":[197],"multi-lane":[198],"(4-stage":[200],"per":[202],"lane)":[203],"does":[205],"not":[206],"require":[207],"any":[208],"specialized":[209],"compound":[210],"function":[211],"units;":[212],"it":[213,218],"reloaded":[216],"enabling":[217],"accelerate":[220],"multiple":[221],"paths.":[223],"We":[224],"have":[225],"developed":[226],"complete":[228],"LLVM-based":[229],"prototype":[231],"simulation":[233],"infrastructure":[234],"demonstrated":[236],"8-lane":[239],"within":[242],"73%":[243],"performance":[246],"an":[248],"ideal":[249],"dataflow":[250],"architecture,":[251],"while":[252],"reducing":[253],"energy":[255],"consumption":[256],"45%":[258],"compared":[259],"4-way":[262],"OOO":[263],"processor.":[264]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
