{"id":"https://openalex.org/W3189151771","doi":"https://doi.org/10.1109/tcad.2021.3103825","title":"A Tensor Processing Framework for CPU-Manycore Heterogeneous Systems","display_name":"A Tensor Processing Framework for CPU-Manycore Heterogeneous Systems","publication_year":2021,"publication_date":"2021-08-10","ids":{"openalex":"https://openalex.org/W3189151771","doi":"https://doi.org/10.1109/tcad.2021.3103825","mag":"3189151771"},"language":"en","primary_location":{"id":"doi:10.1109/tcad.2021.3103825","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcad.2021.3103825","pdf_url":null,"source":{"id":"https://openalex.org/S100835903","display_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","issn_l":"0278-0070","issn":["0278-0070","1937-4151"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101558751","display_name":"Lin Cheng","orcid":"https://orcid.org/0000-0003-4551-2002"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Lin Cheng","raw_affiliation_strings":["School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082177621","display_name":"Peitian Pan","orcid":"https://orcid.org/0000-0001-6147-9092"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Peitian Pan","raw_affiliation_strings":["School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062730166","display_name":"Zhongyuan Zhao","orcid":"https://orcid.org/0000-0002-6637-553X"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhongyuan Zhao","raw_affiliation_strings":["School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102790014","display_name":"Krithik Ranjan","orcid":"https://orcid.org/0000-0002-6083-6251"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Krithik Ranjan","raw_affiliation_strings":["School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055013888","display_name":"Jack Weber","orcid":"https://orcid.org/0000-0002-1688-6358"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]},{"id":"https://openalex.org/I4210099672","display_name":"Accenture (United States)","ror":"https://ror.org/013g16z83","country_code":"US","type":"company","lineage":["https://openalex.org/I4210093804","https://openalex.org/I4210099672"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jack Weber","raw_affiliation_strings":["School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","Accenture, New York, NY, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]},{"raw_affiliation_string":"Accenture, New York, NY, USA","institution_ids":["https://openalex.org/I4210099672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080881573","display_name":"Bandhav Veluri","orcid":"https://orcid.org/0000-0002-5086-9092"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bandhav Veluri","raw_affiliation_strings":["Paul Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA"],"affiliations":[{"raw_affiliation_string":"Paul Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068378841","display_name":"Seyed Borna Ehsani","orcid":"https://orcid.org/0000-0001-9832-9397"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]},{"id":"https://openalex.org/I4210153776","display_name":"Apple (United States)","ror":"https://ror.org/059hsda18","country_code":"US","type":"company","lineage":["https://openalex.org/I4210153776"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Seyed Borna Ehsani","raw_affiliation_strings":["Paul Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA","Apple Inc., Los Altos, CA, USA"],"affiliations":[{"raw_affiliation_string":"Paul Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]},{"raw_affiliation_string":"Apple Inc., Los Altos, CA, USA","institution_ids":["https://openalex.org/I4210153776"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088602116","display_name":"Max Ruttenberg","orcid":null},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Max Ruttenberg","raw_affiliation_strings":["Paul Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA"],"affiliations":[{"raw_affiliation_string":"Paul Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075265279","display_name":"Dai Cheol Jung","orcid":"https://orcid.org/0000-0002-3165-4213"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dai Cheol Jung","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Washington, Seattle, WA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031613824","display_name":"Preslav Ivanov","orcid":null},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Preslav Ivanov","raw_affiliation_strings":["School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021087747","display_name":"Dustin Richmond","orcid":"https://orcid.org/0000-0002-4587-8947"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dustin Richmond","raw_affiliation_strings":["Paul Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA"],"affiliations":[{"raw_affiliation_string":"Paul Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036770962","display_name":"Michael Taylor","orcid":"https://orcid.org/0000-0002-4074-6347"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael B. Taylor","raw_affiliation_strings":["Paul Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA"],"affiliations":[{"raw_affiliation_string":"Paul Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037210004","display_name":"Zhiru Zhang","orcid":"https://orcid.org/0000-0002-0778-0308"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhiru Zhang","raw_affiliation_strings":["School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5091660287","display_name":"Christopher Batten","orcid":"https://orcid.org/0000-0002-2835-667X"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christopher Batten","raw_affiliation_strings":["School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":14,"corresponding_author_ids":["https://openalex.org/A5101558751"],"corresponding_institution_ids":["https://openalex.org/I205783295"],"apc_list":null,"apc_paid":null,"fwci":1.8865,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.85545677,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"41","issue":"6","first_page":"1620","last_page":"1635"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9782000184059143,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8367737531661987},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6585821509361267},{"id":"https://openalex.org/keywords/programmer","display_name":"Programmer","score":0.6404290199279785},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.6037760376930237},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.5684293508529663},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.5191013813018799},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.4551198482513428},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.4257733225822449},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.29889553785324097},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2182237207889557}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8367737531661987},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6585821509361267},{"id":"https://openalex.org/C2778514511","wikidata":"https://www.wikidata.org/wiki/Q1374194","display_name":"Programmer","level":2,"score":0.6404290199279785},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.6037760376930237},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.5684293508529663},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.5191013813018799},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.4551198482513428},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.4257733225822449},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.29889553785324097},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2182237207889557},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcad.2021.3103825","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcad.2021.3103825","pdf_url":null,"source":{"id":"https://openalex.org/S100835903","display_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","issn_l":"0278-0070","issn":["0278-0070","1937-4151"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.9100000262260437}],"awards":[{"id":"https://openalex.org/G4502277801","display_name":null,"funder_award_id":"FA8650-18-2-7863","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G4667086366","display_name":null,"funder_award_id":"1527065","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5266476110","display_name":null,"funder_award_id":"1909661","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7348766185","display_name":null,"funder_award_id":"1512937","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320308737","display_name":"Facebook","ror":"https://ror.org/01zbnvs85"},{"id":"https://openalex.org/F4320314786","display_name":"Xilinx","ror":"https://ror.org/01rb7bk56"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1495581870","https://openalex.org/W1541688521","https://openalex.org/W1969648707","https://openalex.org/W1974420955","https://openalex.org/W1978301594","https://openalex.org/W2017503457","https://openalex.org/W2051598123","https://openalex.org/W2112678088","https://openalex.org/W2143230897","https://openalex.org/W2152839228","https://openalex.org/W2165100134","https://openalex.org/W2194775991","https://openalex.org/W2239894058","https://openalex.org/W2415360376","https://openalex.org/W2474840560","https://openalex.org/W2528553838","https://openalex.org/W2588467645","https://openalex.org/W2606722458","https://openalex.org/W2614094030","https://openalex.org/W2626211758","https://openalex.org/W2798280240","https://openalex.org/W2798482398","https://openalex.org/W2798598799","https://openalex.org/W2804032941","https://openalex.org/W2953384591","https://openalex.org/W2962914733","https://openalex.org/W2963114857","https://openalex.org/W2965444073","https://openalex.org/W2982126433","https://openalex.org/W2990013837","https://openalex.org/W2990912491","https://openalex.org/W3006586535","https://openalex.org/W3015690986","https://openalex.org/W3016735325","https://openalex.org/W3024621361","https://openalex.org/W3103168911","https://openalex.org/W3112773671","https://openalex.org/W3140062895","https://openalex.org/W3140261852","https://openalex.org/W3189388815","https://openalex.org/W4244452576","https://openalex.org/W4244721345","https://openalex.org/W4245683599","https://openalex.org/W4288083528","https://openalex.org/W4295312788","https://openalex.org/W6713134421","https://openalex.org/W6766978945"],"related_works":["https://openalex.org/W2379153735","https://openalex.org/W2046172023","https://openalex.org/W2972896947","https://openalex.org/W2170146914","https://openalex.org/W2355105570","https://openalex.org/W2083974823","https://openalex.org/W2072751097","https://openalex.org/W4237177615","https://openalex.org/W3023876411","https://openalex.org/W123152114"],"abstract_inverted_index":{"Future":[0],"CPU-manycore":[1,95,205],"heterogeneous":[2,96,206],"systems":[3],"can":[4,186],"provide":[5],"high":[6,30],"peak":[7,31],"throughput":[8,32,220],"by":[9],"integrating":[10],"thousands":[11],"of":[12,154,168],"simple,":[13],"independent,":[14],"energy-efficient":[15],"cores":[16,58],"in":[17],"a":[18,75,137,152,164,169,202],"single":[19],"die.":[20],"However,":[21],"there":[22],"are":[23],"two":[24,127],"key":[25],"challenges":[26],"to":[27,61,89,111,142,201,209,226],"translating":[28],"this":[29,72],"into":[33],"improved":[34,222],"end-to-end":[35],"workload":[36],"performance:":[37],"1)":[38],"manycore":[39,54,69,101,171],"co-processors":[40,55],"rely":[41],"on":[42,48,83,94,163,175],"simple":[43],"hardware":[44,121,139],"putting":[45],"significant":[46],"demands":[47],"the":[49,68,100,113],"software":[50,119],"programmer":[51],"and":[52,77,120,132,158,179,221],"2)":[53],"use":[56,106],"in-order":[57],"that":[59,85],"struggle":[60],"tolerate":[62],"long":[63],"memory":[64,102],"latencies.":[65],"To":[66,98],"address":[67,99],"programmability":[70],"challenge,":[71,104],"article":[73],"presents":[74],"dense":[76,178],"sparse":[78,180],"tensor":[79,181],"processing":[80,229],"framework":[81,110],"based":[82],"PyTorch":[84,109,155,160],"enables":[86],"domain":[87],"experts":[88],"easily":[90],"accelerate":[91],"off-the-shelf":[92],"workloads":[93,161,182,185],"systems.":[97],"latency":[103],"we":[105,125],"our":[107,149],"extended":[108],"explore":[112],"potential":[114],"for":[115],"decoupled":[116],"access/execute":[117],"(DAE)":[118],"mechanisms.":[122],"More":[123],"specifically,":[124],"propose":[126],"software-only":[128],"techniques,":[129],"na\u00efve-software":[130],"DAE":[131],"systolic-software":[133],"DAE,":[134],"along":[135],"with":[136],"lightweight":[138],"access":[140],"accelerator":[141],"further":[143],"improve":[144],"area-normalized":[145,219],"throughput.":[146],"We":[147],"evaluate":[148],"techniques":[150],"using":[151],"combination":[153],"operator":[156],"microbenchmarking":[157],"real-world":[159,177],"running":[162],"detailed":[165],"register-transfer-level":[166],"model":[167],"128-core":[170],"architecture.":[172],"Our":[173],"evaluation":[174],"three":[176],"suggests":[183],"these":[184],"achieve":[187],"approximately":[188],"2\u2013":[189],"<inline-formula":[190],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[191],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[192],"<tex-math":[193],"notation=\"LaTeX\">$6\\times":[194],"$":[195],"</tex-math></inline-formula>":[196],"performance":[197],"improvement":[198],"when":[199],"scaled":[200],"future":[203],"2000-core":[204],"system":[207],"compared":[208,225],"an":[210],"18-core":[211],"out-of-order":[212],"CPU":[213],"baseline,":[214],"while":[215],"potentially":[216],"achieving":[217],"higher":[218],"energy":[223],"efficiency":[224],"general-purpose":[227],"graphics":[228],"units.":[230]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
