{"id":"https://openalex.org/W2144928940","doi":"https://doi.org/10.1109/isqed.2008.4479831","title":"Amplifying Embedded System Efficiency via Automatic Instruction Fusion on a Post-Manufacturing Reconfigurable Architecture Platform","display_name":"Amplifying Embedded System Efficiency via Automatic Instruction Fusion on a Post-Manufacturing Reconfigurable Architecture Platform","publication_year":2008,"publication_date":"2008-03-01","ids":{"openalex":"https://openalex.org/W2144928940","doi":"https://doi.org/10.1109/isqed.2008.4479831","mag":"2144928940"},"language":"en","primary_location":{"id":"doi:10.1109/isqed.2008.4479831","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isqed.2008.4479831","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"9th International Symposium on Quality Electronic Design (isqed 2008)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113105093","display_name":"Allen C. Cheng","orcid":null},"institutions":[{"id":"https://openalex.org/I170201317","display_name":"University of Pittsburgh","ror":"https://ror.org/01an3r305","country_code":"US","type":"education","lineage":["https://openalex.org/I170201317"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Allen C. Cheng","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Pittsburgh, Pittsburgh, PA, USA","Univ. of Pittsburgh, Pittsburgh"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Pittsburgh, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I170201317"]},{"raw_affiliation_string":"Univ. of Pittsburgh, Pittsburgh","institution_ids":["https://openalex.org/I170201317"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5113105093"],"corresponding_institution_ids":["https://openalex.org/I170201317"],"apc_list":null,"apc_paid":null,"fwci":0.3466,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.70684014,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"744","last_page":"749"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7621069550514221},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.6834968328475952},{"id":"https://openalex.org/keywords/application-specific-integrated-circuit","display_name":"Application-specific integrated circuit","score":0.6719815731048584},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.5794280767440796},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.5341400504112244},{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.5072538256645203},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.49913740158081055},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.486655056476593},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.4290856719017029},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.20193934440612793},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1657053828239441},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11294972896575928}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7621069550514221},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.6834968328475952},{"id":"https://openalex.org/C77390884","wikidata":"https://www.wikidata.org/wiki/Q217302","display_name":"Application-specific integrated circuit","level":2,"score":0.6719815731048584},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.5794280767440796},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5341400504112244},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.5072538256645203},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.49913740158081055},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.486655056476593},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.4290856719017029},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.20193934440612793},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1657053828239441},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11294972896575928},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/isqed.2008.4479831","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isqed.2008.4479831","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"9th International Symposium on Quality Electronic Design (isqed 2008)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8899999856948853,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1974169079","https://openalex.org/W2001655225","https://openalex.org/W2096835686","https://openalex.org/W2101285334","https://openalex.org/W2104225326","https://openalex.org/W2107923684","https://openalex.org/W2117285153","https://openalex.org/W2130766965","https://openalex.org/W2144915013","https://openalex.org/W2155509874","https://openalex.org/W2165108487","https://openalex.org/W2535965777","https://openalex.org/W2537134123","https://openalex.org/W4249006057","https://openalex.org/W4255734830"],"related_works":["https://openalex.org/W2293118914","https://openalex.org/W2998381397","https://openalex.org/W4236419692","https://openalex.org/W3167919718","https://openalex.org/W4251718783","https://openalex.org/W2171015181","https://openalex.org/W2999668243","https://openalex.org/W1485756991","https://openalex.org/W2376218453","https://openalex.org/W2984236338"],"abstract_inverted_index":{"Portable":[0],"embedded":[1,66,174],"SoC":[2,67],"processor":[3,83,175,238],"architects":[4],"are":[5,77],"constantly":[6],"challenged":[7],"by":[8,176,209,223,242],"exponentially":[9],"increasing":[10],"demand":[11],"for":[12,260],"newer":[13],"functionality,":[14],"faster":[15],"real-time":[16],"communication,":[17],"stronger":[18],"security,":[19],"and":[20,32,109,121,133,164,186,200,234,240,246,256],"higher":[21],"reliability;":[22],"while":[23,105],"the":[24,60,64,81,88,99,116,153,178,214,236],"constraint":[25],"on":[26,51],"energy,":[27],"feature":[28],"size,":[29],"NRE":[30,108],"cost,":[31],"time-to-market":[33],"(TTM)":[34],"grows":[35],"tighter":[36],"than":[37],"ever.":[38],"Existing":[39],"approaches":[40],"attempting":[41],"to":[42,56,80,86,161,197,254],"achieve":[43,95],"these":[44,126],"mutual":[45],"conflicting":[46],"design":[47,147],"goals":[48],"rely":[49],"heavily":[50],"adopting":[52],"special-purpose":[53],"accelerators":[54],"(SPA)":[55],"take":[57],"charge":[58],"of":[59,91,101,118,156,173,213],"heavy":[61],"lifting":[62],"in":[63],"aimed":[65],"designs.":[68],"These":[69],"SPAs,":[70],"synthesized":[71],"from":[72,152],"either":[73],"ASIC":[74],"or":[75],"FPGA,":[76],"usually":[78],"augmented":[79],"base":[82],"as":[84,128,203],"co-processors":[85,129],"execute":[87],"performance-critical":[89],"regions":[90],"applications.":[92],"ASIC-based":[93],"SPAs":[94,112,127,160],"performance-energy":[96],"efficiency":[97],"at":[98,115],"expense":[100,117],"sacrificing":[102],"post-manufacturing":[103],"programmability":[104,114],"incurring":[106],"large":[107],"TTM;":[110],"FPGA-based":[111],"retain":[113],"significant":[119],"energy":[120],"area":[122,264],"increase.":[123,265],"Furthermore,":[124],"augmenting":[125],"adds":[130],"considerable":[131],"communication":[132],"synchronization":[134],"overhead":[135],"severely":[136],"compromising":[137],"their":[138],"initially":[139],"promised":[140],"benefits.":[141],"This":[142],"paper":[143],"proposes":[144],"an":[145,162],"innovative":[146],"paradigm":[148],"that":[149],"moves":[150],"away":[151],"common":[154],"scheme":[155],"adding":[157],"co-processing":[158],"ASIC/FPGA":[159],"integrated":[163],"reconfigurable":[165],"design.":[166],"Specifically,":[167],"we":[168],"propose":[169],"a":[170,183,204,224],"new":[171],"class":[172],"replacing":[177],"processor's":[179],"conventional":[180],"ALU":[181],"with":[182,262],"more":[184],"powerful":[185],"flexible":[187],"versatile":[188],"processing":[189],"unit":[190],"(VPU).":[191],"VPU":[192,207,229],"enables":[193],"multiple":[194],"interdependent":[195],"instructions":[196],"be":[198],"fused":[199],"processed":[201],"together":[202],"single":[205],"atomic":[206],"instruction":[208,218],"exploring":[210],"dataflow":[211],"dependencies":[212],"application":[215],"code.":[216,249],"The":[217,227],"fusion":[219],"is":[220],"automatically":[221],"performed":[222],"VPU-aware":[225],"compiler.":[226],"optimized":[228],"code":[230,232],"reduces":[231],"size":[233],"amplifies":[235],"effective":[237],"bandwidth":[239],"capacity":[241],"eliminating":[243],"transient":[244],"computation":[245],"register":[247],"spill":[248],"Experimental":[250],"results":[251],"show":[252],"up":[253],"400%":[255],"average":[257],"150%":[258],"speedup":[259],"MediaBench":[261],"negligible":[263]},"counts_by_year":[{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
