{"id":"https://openalex.org/W4389491968","doi":"https://doi.org/10.1145/3613424.3614268","title":"MAICC : A Lightweight Many-core Architecture with In-Cache Computing for Multi-DNN Parallel Inference","display_name":"MAICC : A Lightweight Many-core Architecture with In-Cache Computing for Multi-DNN Parallel Inference","publication_year":2023,"publication_date":"2023-10-28","ids":{"openalex":"https://openalex.org/W4389491968","doi":"https://doi.org/10.1145/3613424.3614268"},"language":"en","primary_location":{"id":"doi:10.1145/3613424.3614268","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3613424.3614268","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3613424.3614268","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"56th Annual IEEE/ACM International Symposium on Microarchitecture","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3613424.3614268","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101735762","display_name":"Renhao Fan","orcid":"https://orcid.org/0009-0002-9136-1831"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Renhao Fan","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, China"],"raw_orcid":"https://orcid.org/0009-0002-9136-1831","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102005731","display_name":"Yikai Cui","orcid":"https://orcid.org/0000-0001-6283-8405"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yikai Cui","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, China"],"raw_orcid":"https://orcid.org/0000-0001-6283-8405","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012080243","display_name":"Qilin Chen","orcid":"https://orcid.org/0000-0002-1872-1290"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qilin Chen","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, China"],"raw_orcid":"https://orcid.org/0000-0002-1872-1290","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100350118","display_name":"Mingyu Wang","orcid":"https://orcid.org/0000-0003-4006-8870"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingyu Wang","raw_affiliation_strings":["School of Microelectronics Science and Technology, Sun Yat-Sen University, China"],"raw_orcid":"https://orcid.org/0000-0003-4006-8870","affiliations":[{"raw_affiliation_string":"School of Microelectronics Science and Technology, Sun Yat-Sen University, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016596981","display_name":"Youhui Zhang","orcid":"https://orcid.org/0000-0003-2333-3580"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Youhui Zhang","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, China and Zhongguancun Laboratory, China"],"raw_orcid":"https://orcid.org/0000-0003-2333-3580","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, China and Zhongguancun Laboratory, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101713157","display_name":"Weimin Zheng","orcid":"https://orcid.org/0009-0008-3026-2278"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weimin Zheng","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, China"],"raw_orcid":"https://orcid.org/0009-0008-3026-2278","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057648062","display_name":"Zhaolin Li","orcid":"https://orcid.org/0009-0001-1131-3024"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhaolin Li","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, China"],"raw_orcid":"https://orcid.org/0009-0001-1131-3024","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.0105,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.79133279,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"411","last_page":"423"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8690098524093628},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6698595881462097},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.6006233096122742},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.5761493444442749},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.5612742304801941},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5062462687492371},{"id":"https://openalex.org/keywords/microarchitecture","display_name":"Microarchitecture","score":0.4417303800582886},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.41123026609420776},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.38184854388237},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.14584267139434814}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8690098524093628},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6698595881462097},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.6006233096122742},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.5761493444442749},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.5612742304801941},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5062462687492371},{"id":"https://openalex.org/C107598950","wikidata":"https://www.wikidata.org/wiki/Q259864","display_name":"Microarchitecture","level":2,"score":0.4417303800582886},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.41123026609420776},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.38184854388237},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.14584267139434814}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3613424.3614268","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3613424.3614268","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3613424.3614268","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"56th Annual IEEE/ACM International Symposium on Microarchitecture","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3613424.3614268","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3613424.3614268","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3613424.3614268","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"56th Annual IEEE/ACM International Symposium on Microarchitecture","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.8999999761581421,"id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G1799504355","display_name":null,"funder_award_id":"No.62250006, 62072266, 62204271","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3040571651","display_name":null,"funder_award_id":"62204271","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G330528761","display_name":null,"funder_award_id":"2020YFB1600200","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G3911511746","display_name":null,"funder_award_id":"62250006","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G404823856","display_name":null,"funder_award_id":"No.2020YFB1600200","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G6132722138","display_name":"\u7c7b\u8111\u8ba1\u7b97\u7cfb\u7edf\u5c42\u6b21\u7ed3\u6784\u4e0e\u5b8c\u5907\u6027\u7814\u7a76","funder_award_id":"62072266","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G835360120","display_name":null,"funder_award_id":"BNR2022RC01003","funder_id":"https://openalex.org/F4320329777","funder_display_name":"Beijing National Research Center For Information Science And Technology"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322392","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549"},{"id":"https://openalex.org/F4320329777","display_name":"Beijing National Research Center For Information Science And Technology","ror":null},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4389491968.pdf","grobid_xml":"https://content.openalex.org/works/W4389491968.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W1977661221","https://openalex.org/W2064675550","https://openalex.org/W2097117768","https://openalex.org/W2102605133","https://openalex.org/W2118231264","https://openalex.org/W2170382128","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2331783522","https://openalex.org/W2442974303","https://openalex.org/W2588467645","https://openalex.org/W2605347906","https://openalex.org/W2606722458","https://openalex.org/W2612690371","https://openalex.org/W2798598799","https://openalex.org/W2804032941","https://openalex.org/W2883929540","https://openalex.org/W2935331687","https://openalex.org/W2950138172","https://openalex.org/W2963037989","https://openalex.org/W2963122961","https://openalex.org/W2972054167","https://openalex.org/W2976137532","https://openalex.org/W2976534600","https://openalex.org/W2981207549","https://openalex.org/W2994193159","https://openalex.org/W2996945478","https://openalex.org/W3006586535","https://openalex.org/W3048581975","https://openalex.org/W3112773671","https://openalex.org/W3187235458","https://openalex.org/W3189151771","https://openalex.org/W3201271601","https://openalex.org/W4253012315","https://openalex.org/W4310362310"],"related_works":["https://openalex.org/W1547865754","https://openalex.org/W2276000909","https://openalex.org/W122453572","https://openalex.org/W2466405623","https://openalex.org/W2131429702","https://openalex.org/W3023876411","https://openalex.org/W2351011383","https://openalex.org/W2146879484","https://openalex.org/W4221002079","https://openalex.org/W1757458251"],"abstract_inverted_index":{"The":[0,105],"growing":[1],"complexity":[2],"and":[3,14,40,54,67,90,145,166,191,213,239],"diversity":[4],"of":[5,11,21,52,77,98,127,161],"neural":[6],"networks":[7],"in":[8,122,135],"the":[9,19,49,73,83,108,123,132,142,146,150,155,162,167,185,204],"fields":[10],"autonomous":[12],"driving":[13],"intelligent":[15],"robots":[16],"have":[17],"facilitated":[18],"research":[20],"many-core":[22,57,92,186],"architectures,":[23],"which":[24,194],"can":[25,138],"offer":[26],"sufficient":[27],"programming":[28],"flexibility":[29],"to":[30,43,48,71,113,179],"simultaneously":[31],"support":[32],"multi-DNN":[33,78,197],"parallel":[34,79,159,198],"inference":[35],"with":[36,102,149,154,234],"different":[37],"network":[38],"structures":[39],"sizes":[41],"compared":[42],"domain-specific":[44],"architectures.":[45],"However,":[46],"due":[47],"tight":[50],"constraints":[51],"area":[53],"power":[55],"consumption,":[56],"architectures":[58],"typically":[59],"use":[60],"lightweight":[61,99],"scalar":[62],"cores":[63,101],"without":[64],"vector":[65,115,170],"units":[66],"are":[68],"almost":[69],"unable":[70],"meet":[72],"high-performance":[74],"computing":[75,147],"needs":[76],"inference.":[80,199],"To":[81],"solve":[82],"above":[84],"problem,":[85],"we":[86],"design":[87],"an":[88],"area-":[89],"energy-efficient":[91],"architecture":[93,106,187,207],"by":[94,118,188],"integrating":[95],"large":[96],"amounts":[97],"processor":[100],"RV32IMA":[103],"ISA.":[104],"leverages":[107],"emerging":[109],"SRAM-based":[110],"computing-in-memory":[111],"technology":[112],"implement":[114],"instruction":[116],"extensions":[117],"reusing":[119],"memory":[120,143,238],"cells":[121],"data":[124,133],"cache":[125,134],"instead":[126],"conventional":[128],"logic":[129],"circuits.":[130],"Thus,":[131],"each":[136],"core":[137,156],"be":[139],"reconfigured":[140],"as":[141],"part":[144,148],"latter":[151],"tightly":[152],"coupled":[153],"pipeline,":[157],"enabling":[158],"execution":[160,175],"basic":[163],"RISC-V":[164],"instructions":[165],"extended":[168],"multi-cycle":[169],"instructions.":[171],"Furthermore,":[172],"a":[173,209,225],"corresponding":[174],"framework":[176],"is":[177],"proposed":[178,205],"effectively":[180],"map":[181],"DNN":[182],"models":[183],"onto":[184],"using":[189],"intra-layer":[190],"inter-layer":[192],"pipelining,":[193],"potentially":[195],"supports":[196],"Experimental":[200],"results":[201],"show":[202],"that":[203],"MAICC":[206,222],"obtains":[208],"4.3":[210],"\u00d7":[211,215,227],"throughput":[212],"31.6":[214],"energy":[216,228],"efficiency":[217,229],"over":[218,230],"CPU":[219],"(Intel":[220],"i9-13900k).":[221],"also":[223],"achieves":[224],"1.8":[226],"GPU":[231],"(RTX":[232],"4090)":[233],"only":[235],"4MB":[236],"on-chip":[237],"28":[240],"mm2":[241],"area.":[242]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
