{"id":"https://openalex.org/W4410583577","doi":"https://doi.org/10.23919/date64628.2025.10992996","title":"TCDM Burst Access: Breaking the Bandwidth Barrier in Shared-L1 RVV Clusters Beyond 1000 FPUs","display_name":"TCDM Burst Access: Breaking the Bandwidth Barrier in Shared-L1 RVV Clusters Beyond 1000 FPUs","publication_year":2025,"publication_date":"2025-03-31","ids":{"openalex":"https://openalex.org/W4410583577","doi":"https://doi.org/10.23919/date64628.2025.10992996"},"language":"en","primary_location":{"id":"doi:10.23919/date64628.2025.10992996","is_oa":false,"landing_page_url":"https://doi.org/10.23919/date64628.2025.10992996","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Design, Automation &amp;amp; Test in Europe Conference (DATE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057255049","display_name":"Dejian Shen","orcid":"https://orcid.org/0000-0002-0283-6835"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Diyou Shen","raw_affiliation_strings":["ETH Z&#x00FC;rich,Integrated Systems Laboratory,Z&#x00FC;rich,Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Z&#x00FC;rich,Integrated Systems Laboratory,Z&#x00FC;rich,Switzerland","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100625410","display_name":"Yichao Zhang","orcid":"https://orcid.org/0009-0008-7508-599X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yichao Zhang","raw_affiliation_strings":["ETH Z&#x00FC;rich,Integrated Systems Laboratory,Z&#x00FC;rich,Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Z&#x00FC;rich,Integrated Systems Laboratory,Z&#x00FC;rich,Switzerland","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020963902","display_name":"Marco Bertuletti","orcid":"https://orcid.org/0000-0001-7576-0803"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Marco Bertuletti","raw_affiliation_strings":["ETH Z&#x00FC;rich,Integrated Systems Laboratory,Z&#x00FC;rich,Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Z&#x00FC;rich,Integrated Systems Laboratory,Z&#x00FC;rich,Switzerland","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043408422","display_name":"Luca Benini","orcid":"https://orcid.org/0000-0001-8068-3806"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luca Benini","raw_affiliation_strings":["ETH Z&#x00FC;rich,Integrated Systems Laboratory,Z&#x00FC;rich,Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Z&#x00FC;rich,Integrated Systems Laboratory,Z&#x00FC;rich,Switzerland","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5057255049"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.11556796,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12146","display_name":"Power Line Communications and Noise","score":0.9016000032424927,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12146","display_name":"Power Line Communications and Noise","score":0.9016000032424927,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.622319221496582},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5687416791915894},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.45654749870300293}],"concepts":[{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.622319221496582},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5687416791915894},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.45654749870300293}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.23919/date64628.2025.10992996","is_oa":false,"landing_page_url":"https://doi.org/10.23919/date64628.2025.10992996","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Design, Automation &amp;amp; Test in Europe Conference (DATE)","raw_type":"proceedings-article"},{"id":"pmh:oai:cris.unibo.it:11585/1040791","is_oa":false,"landing_page_url":"https://hdl.handle.net/11585/1040791","pdf_url":null,"source":{"id":"https://openalex.org/S4306402579","display_name":"Archivio istituzionale della ricerca (Alma Mater Studiorum Universit\u00e0 di Bologna)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210117483","host_organization_name":"Istituto di Ematologia di Bologna","host_organization_lineage":["https://openalex.org/I4210117483"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2795268038","https://openalex.org/W2945665019","https://openalex.org/W3184037151","https://openalex.org/W4206371601","https://openalex.org/W4286563542","https://openalex.org/W4312968147","https://openalex.org/W4376481202","https://openalex.org/W4386025602","https://openalex.org/W4386090486","https://openalex.org/W4396816723","https://openalex.org/W4402475804","https://openalex.org/W6738791726","https://openalex.org/W6987026237"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"As":[0],"computing":[1],"demand":[2],"and":[3,41,50,178,197,215,240],"memory":[4,18,43,81,126],"footprint":[5],"of":[6,12,173,204],"deep":[7],"learning":[8],"applications":[9],"accelerate,":[10],"clusters":[11,102],"cores":[13,40,106],"sharing":[14],"local":[15],"(L1)":[16],"multi-banked":[17,111],"are":[19,54,61,134],"widely":[20],"used":[21],"as":[22,79],"key":[23],"building":[24],"blocks":[25],"in":[26,101,136,221,243],"large-scale":[27],"architectures.":[28],"When":[29],"the":[30,87,155,171,205,228],"cluster's":[31],"core":[32,159],"count":[33],"increases,":[34],"a":[35,46,92,110,118,148,174,176,179],"flat":[36],"all-to-all":[37],"interconnect":[38],"between":[39],"L1":[42,112,125],"banks":[44],"becomes":[45],"physical":[47],"implementation":[48],"bottleneck,":[49],"hierarchical":[51],"network":[52],"topologies":[53],"required.":[55],"However,":[56],"hierarchical,":[57],"multilevel":[58],"intra-cluster":[59],"networks":[60],"subject":[62],"to":[63,69,97,109,124,202,227,236],"internal":[64],"contention":[65],"which":[66],"may":[67],"lead":[68],"significant":[70],"performance":[71,218,242],"degradation,":[72],"especially":[73],"for":[74],"SIMD":[75],"or":[76],"vector":[77,105],"cores,":[78],"their":[80],"access":[82,230],"is":[83],"bursty.":[84],"We":[85,143],"present":[86],"TCDM":[88],"Burst":[89,119,192],"Access":[90],"architecture,":[91],"software-transparent":[93],"burst":[94,122,132],"transaction":[95],"support":[96],"improve":[98,170],"bandwidth":[99,172,213],"utilization":[100,214],"with":[103,140],"many":[104],"tightly":[107],"coupled":[108],"data":[113],"memory.":[114],"In":[115],"our":[116,145,209,232],"solution,":[117],"Manager":[120],"dispatches":[121],"requests":[123],"banks,":[127],"multiple":[128],"32b":[129],"words":[130],"from":[131],"responses":[133],"retired":[135],"parallel":[137],"on":[138,147,157],"channels":[139],"parametric":[141],"data-width.":[142],"validate":[144],"design":[146,210],"RISC-V":[149],"Vector":[150],"(RVV)":[151],"many-core":[152],"cluster,":[153],"evaluating":[154],"benefits":[156],"different":[158],"counts.":[160],"With":[161],"minimal":[162],"logic":[163],"area":[164],"overhead":[165],"(less":[166],"than":[167],"8%),":[168],"we":[169],"16-,":[175],"256-,":[177],"1024-Floating":[180],"Point":[181],"Unit":[182],"(FPU)":[183],"baseline":[184],"clusters,":[185],"without":[186],"Tightly":[187],"Coupled":[188],"Data":[189],"Memory":[190],"(TCDM)":[191],"Access,":[193],"by":[194],"118%,":[195],"226%,":[196],"77%":[198],"respectively.":[199],"Reaching":[200],"up":[201,235],"80%":[203],"cores-memory":[206],"peak":[207],"bandwidth,":[208],"demonstrates":[211],"ultra-high":[212],"enables":[216],"efficient":[217],"scaling.":[219],"Implemented":[220],"12-nm":[222],"FinFET":[223],"technology":[224],"node,":[225],"compared":[226],"serialized":[229],"baseline,":[231],"solution":[233],"achieves":[234],"1.9x":[237],"energy":[238],"efficiency":[239],"2.76x":[241],"real-world":[244],"kernel":[245],"benchmarkings.":[246]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
