{"id":"https://openalex.org/W4409248516","doi":"https://doi.org/10.1109/hpca61900.2025.00048","title":"SoMa: Identifying, Exploring, and Understanding the DRAM Communication Scheduling Space for DNN Accelerators","display_name":"SoMa: Identifying, Exploring, and Understanding the DRAM Communication Scheduling Space for DNN Accelerators","publication_year":2025,"publication_date":"2025-03-01","ids":{"openalex":"https://openalex.org/W4409248516","doi":"https://doi.org/10.1109/hpca61900.2025.00048"},"language":"en","primary_location":{"id":"doi:10.1109/hpca61900.2025.00048","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca61900.2025.00048","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001158014","display_name":"Jingwei Cai","orcid":"https://orcid.org/0009-0003-7560-8141"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jingwei Cai","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100329001","display_name":"Xuan Wang","orcid":"https://orcid.org/0000-0002-5808-1929"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuan Wang","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003379072","display_name":"Mingyu Gao","orcid":"https://orcid.org/0000-0001-9377-9292"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingyu Gao","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102847848","display_name":"Sen Peng","orcid":"https://orcid.org/0009-0002-5312-2557"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sen Peng","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100945324","display_name":"Zijian Zhu","orcid":"https://orcid.org/0000-0002-8867-0281"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zijian Zhu","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010247448","display_name":"Yuchen Wei","orcid":"https://orcid.org/0009-0003-5752-5422"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuchen Wei","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087025919","display_name":"Zuotong Wu","orcid":"https://orcid.org/0009-0000-1368-661X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zuotong Wu","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006570986","display_name":"Kaisheng Ma","orcid":"https://orcid.org/0000-0001-9226-3366"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaisheng Ma","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5001158014"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":4.1568,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.93691785,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"533","last_page":"548"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11005","display_name":"Radiation Effects in Electronics","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11005","display_name":"Radiation Effects in Electronics","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11392","display_name":"Energy Harvesting in Wireless Networks","score":0.9836000204086304,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11044","display_name":"Particle Detector Development and Performance","score":0.9822999835014343,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/soma","display_name":"Soma","score":0.8202361464500427},{"id":"https://openalex.org/keywords/dram","display_name":"Dram","score":0.7754764556884766},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7369664907455444},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.6027415990829468},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.40411123633384705},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.363675594329834},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.13827988505363464},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.10658064484596252},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.10238584876060486},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.08408638834953308}],"concepts":[{"id":"https://openalex.org/C2779617337","wikidata":"https://www.wikidata.org/wiki/Q842429","display_name":"Soma","level":2,"score":0.8202361464500427},{"id":"https://openalex.org/C7366592","wikidata":"https://www.wikidata.org/wiki/Q1255620","display_name":"Dram","level":2,"score":0.7754764556884766},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7369664907455444},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.6027415990829468},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.40411123633384705},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.363675594329834},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.13827988505363464},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.10658064484596252},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.10238584876060486},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.08408638834953308},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca61900.2025.00048","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca61900.2025.00048","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322392","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W2048266589","https://openalex.org/W2152839228","https://openalex.org/W2194775991","https://openalex.org/W2605347906","https://openalex.org/W2906043559","https://openalex.org/W2981985696","https://openalex.org/W2982050681","https://openalex.org/W2982135357","https://openalex.org/W2997929983","https://openalex.org/W3012493694","https://openalex.org/W3090495278","https://openalex.org/W3135242540","https://openalex.org/W3135807226","https://openalex.org/W3193212547","https://openalex.org/W4248707617","https://openalex.org/W4249932213","https://openalex.org/W4280562683","https://openalex.org/W4281708879","https://openalex.org/W4288083528","https://openalex.org/W4292169167","https://openalex.org/W4318541578","https://openalex.org/W4360831791","https://openalex.org/W4360831828","https://openalex.org/W4380881063","https://openalex.org/W4380881154","https://openalex.org/W4385245566","https://openalex.org/W4388626384","https://openalex.org/W4393592481","https://openalex.org/W4401211704","https://openalex.org/W6694260854","https://openalex.org/W6736288088","https://openalex.org/W6755207826","https://openalex.org/W6761458982","https://openalex.org/W6766720298","https://openalex.org/W6769715254","https://openalex.org/W6776015948","https://openalex.org/W6782615464","https://openalex.org/W6784702356","https://openalex.org/W6794326018","https://openalex.org/W6794597259","https://openalex.org/W6799534101","https://openalex.org/W6799690380","https://openalex.org/W6821704442","https://openalex.org/W6847801047","https://openalex.org/W6861427027"],"related_works":["https://openalex.org/W2101180249","https://openalex.org/W3120961607","https://openalex.org/W2040277507","https://openalex.org/W4401568740","https://openalex.org/W3192405764","https://openalex.org/W3148568549","https://openalex.org/W2323108107","https://openalex.org/W2033189714","https://openalex.org/W2098207691","https://openalex.org/W2010336780"],"abstract_inverted_index":{"Modern":[0],"Deep":[1],"Neural":[2],"Network":[3],"(DNN)":[4],"accelerators":[5,183],"are":[6],"equipped":[7],"with":[8,207],"increasingly":[9,20,76],"larger":[10],"on-chip":[11],"buffers":[12,41],"to":[13,17,45,72,81,135,153,170,233],"provide":[14],"more":[15],"opportunities":[16,102],"alleviate":[18],"the":[19,53,75,100,109,115,121,127,162,175,208,245],"severe":[21],"DRAM":[22,60,83,104,156,166,178,246],"bandwidth":[23],"pressure.":[24],"However,":[25],"most":[26,47,51],"existing":[27,112],"research":[28],"on":[29,35,59,114,215],"buffer":[30,79],"utilization":[31],"still":[32],"primarily":[33],"focuses":[34],"single-layer":[36,48,56],"dataflow":[37,57],"scheduling":[38,106,126,158,180,190,248],"optimization.":[39],"As":[40],"grow":[42],"large":[43],"enough":[44],"accommodate":[46],"weights":[49],"in":[50,103,125,225],"networks,":[52],"impact":[54],"of":[55,111,129,165,177],"optimization":[58,101,123,141],"communication":[61,105,157,167,179,247],"diminishes":[62],"significantly.":[63],"Therefore,":[64],"developing":[65],"new":[66],"paradigms":[67],"that":[68],"fuse":[69],"multiple":[70],"layers":[71],"fully":[73,138],"leverage":[74,231],"abundant":[77],"onchip":[78],"resources":[80],"reduce":[82],"accesses":[84],"has":[85,194,260],"become":[86],"particularly":[87],"important,":[88],"yet":[89],"remains":[90],"an":[91,188],"open":[92],"challenge.To":[93],"address":[94],"this":[95],"challenge,":[96],"we":[97,143,186,230],"first":[98],"identify":[99],"by":[107],"analyzing":[108],"drawbacks":[110],"works":[113],"layer":[116],"fusion":[117],"paradigm":[118],"and":[119,133,148,160,172,184,221,243],"recognizing":[120],"vast":[122],"potential":[124],"timing":[128],"data":[130],"prefetching":[131],"from":[132],"storing":[134],"DRAM.":[136],"To":[137],"exploit":[139],"these":[140],"opportunities,":[142],"develop":[144,187],"a":[145,199,217,222,251],"Tensor-centric":[146],"Notation":[147],"its":[149],"corresponding":[150],"parsing":[151],"method":[152],"represent":[154],"different":[155],"schemes":[159],"depict":[161],"overall":[163],"space":[164,176,240,249],"scheduling.":[168],"Then,":[169,229],"thoroughly":[171],"efficiently":[173],"explore":[174],"for":[181,201,236],"diverse":[182],"workloads,":[185],"end-to-end":[189],"framework,":[191,212],"SoMa,":[192],"which":[193],"already":[195],"been":[196,261],"developed":[197],"into":[198],"compiler":[200],"our":[202],"commercial":[203],"accelerator":[204],"product.":[205],"Compared":[206],"state-of-the-art":[209],"(SOTA)":[210],"Cocco":[211],"SoMa":[213,232,259],"achieves,":[214],"average,":[216],"2.11\u00d7":[218],"performance":[219],"improvement":[220],"37.3%":[223],"reduction":[224],"energy":[226],"cost":[227],"simultaneously.":[228],"study":[234],"optimizations":[235],"LLM,":[237],"perform":[238],"design":[239],"exploration":[241],"(DSE),":[242],"analyze":[244],"through":[250],"practical":[252],"example,":[253],"yielding":[254],"some":[255],"interesting":[256],"insights.":[257],"Moreover,":[258],"open-sourced":[262],"at":[263],"https://github.com/SET-Scheduling-Project/SoMa-HPCA2025.":[264]},"counts_by_year":[{"year":2025,"cited_by_count":5}],"updated_date":"2026-03-04T09:10:02.777135","created_date":"2025-10-10T00:00:00"}
