{"id":"https://openalex.org/W2783347670","doi":"https://doi.org/10.1109/asicon.2017.8252595","title":"A chain-multiplier for large scale matrix multiplication","display_name":"A chain-multiplier for large scale matrix multiplication","publication_year":2017,"publication_date":"2017-10-01","ids":{"openalex":"https://openalex.org/W2783347670","doi":"https://doi.org/10.1109/asicon.2017.8252595","mag":"2783347670"},"language":"en","primary_location":{"id":"doi:10.1109/asicon.2017.8252595","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asicon.2017.8252595","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE 12th International Conference on ASIC (ASICON)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031128024","display_name":"Can Wei","orcid":"https://orcid.org/0000-0003-4291-7653"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Can Wei","raw_affiliation_strings":["Institute of VLSI Design, Hefei University of Technology, Hefei, Anhui, China"],"affiliations":[{"raw_affiliation_string":"Institute of VLSI Design, Hefei University of Technology, Hefei, Anhui, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114973839","display_name":"Yukun Song","orcid":"https://orcid.org/0009-0004-9843-3505"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yukun Song","raw_affiliation_strings":["Institute of VLSI Design, Hefei University of Technology, Hefei, Anhui, China"],"affiliations":[{"raw_affiliation_string":"Institute of VLSI Design, Hefei University of Technology, Hefei, Anhui, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001713932","display_name":"Duoli Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Duoli Zhang","raw_affiliation_strings":["Institute of VLSI Design, Hefei University of Technology, Hefei, Anhui, China"],"affiliations":[{"raw_affiliation_string":"Institute of VLSI Design, Hefei University of Technology, Hefei, Anhui, China","institution_ids":["https://openalex.org/I16365422"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5031128024"],"corresponding_institution_ids":["https://openalex.org/I16365422"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.20966782,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":93},"biblio":{"volume":null,"issue":null,"first_page":"792","last_page":"795"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.71732097864151},{"id":"https://openalex.org/keywords/matrix-multiplication","display_name":"Matrix multiplication","score":0.6959478259086609},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6750311851501465},{"id":"https://openalex.org/keywords/systolic-array","display_name":"Systolic array","score":0.5636545419692993},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.5592122077941895},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.5320547223091125},{"id":"https://openalex.org/keywords/multiplier","display_name":"Multiplier (economics)","score":0.5074395537376404},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.5001819133758545},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4324647784233093},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.4122586250305176},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3277202248573303},{"id":"https://openalex.org/keywords/very-large-scale-integration","display_name":"Very-large-scale integration","score":0.10966163873672485}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.71732097864151},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.6959478259086609},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6750311851501465},{"id":"https://openalex.org/C150741067","wikidata":"https://www.wikidata.org/wiki/Q2377218","display_name":"Systolic array","level":3,"score":0.5636545419692993},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.5592122077941895},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.5320547223091125},{"id":"https://openalex.org/C124584101","wikidata":"https://www.wikidata.org/wiki/Q1053266","display_name":"Multiplier (economics)","level":2,"score":0.5074395537376404},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.5001819133758545},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4324647784233093},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4122586250305176},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3277202248573303},{"id":"https://openalex.org/C14580979","wikidata":"https://www.wikidata.org/wiki/Q876049","display_name":"Very-large-scale integration","level":2,"score":0.10966163873672485},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C139719470","wikidata":"https://www.wikidata.org/wiki/Q39680","display_name":"Macroeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/asicon.2017.8252595","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asicon.2017.8252595","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE 12th International Conference on ASIC (ASICON)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6299999952316284,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W161315898","https://openalex.org/W1509443229","https://openalex.org/W1961164518","https://openalex.org/W2017369466","https://openalex.org/W2035476608","https://openalex.org/W2054388411","https://openalex.org/W2059003054","https://openalex.org/W2063186542","https://openalex.org/W2082292996","https://openalex.org/W2094139070","https://openalex.org/W2159789820","https://openalex.org/W3141650078"],"related_works":["https://openalex.org/W2022229285","https://openalex.org/W46448156","https://openalex.org/W2283084692","https://openalex.org/W2130878144","https://openalex.org/W3172158163","https://openalex.org/W2150609674","https://openalex.org/W2138404091","https://openalex.org/W3034729708","https://openalex.org/W2078475991","https://openalex.org/W1998203035"],"abstract_inverted_index":{"Matrix":[0],"operation":[1,117,124,163],"has":[2,48,93],"high":[3,107],"time":[4],"complexity":[5],"and":[6,22,161,182],"traditional":[7],"serial":[8],"algorithm":[9],"is":[10,67,120,153,158],"less":[11],"efficient.":[12],"In":[13,55,90],"the":[14,33,39,50,74,78,84,87,100,149,155,168,184],"existing":[15],"design":[16,70,129,177],"of":[17,35,52,102,116,125,173],"matrix":[18,36,65,123],"multiplication,":[19],"systolic":[20,174],"array":[21],"other":[23],"methods":[24],"are":[25],"usually":[26],"used":[27],"for":[28,62,96,122,135],"hardware":[29,59],"acceleration.":[30],"But":[31],"as":[32],"scale":[34,64],"computing":[37,79],"increases,":[38],"\u201cstorage":[40,103],"wall\u201d":[41],"problem":[42],"caused":[43],"by":[44],"data":[45,75,97],"throughput":[46],"bandwidth":[47,157,181],"become":[49],"bottleneck":[51],"performance":[53],"improvement.":[54],"this":[56],"paper,":[57],"a":[58],"accelerator":[60],"suitable":[61,121],"large":[63],"multiplication":[66],"proposed.":[68],"This":[69],"takes":[71],"non-buffering":[72],"organization,":[73],"entered":[76],"into":[77],"unit":[80],"directly":[81],"involved":[82],"in":[83,162],"operation,":[85],"reducing":[86],"storage":[88],"pressure.":[89],"addition,":[91],"it":[92],"low":[94],"demand":[95],"throughput,":[98],"avoiding":[99],"impact":[101],"wall\u201d,":[104],"while":[105],"maintaining":[106],"operational":[108,186],"performance.":[109,187],"The":[110,128],"multiplier":[111],"also":[112],"supports":[113],"on-line":[114],"configuration":[115],"scale,":[118],"which":[119,138],"different":[126],"scales.":[127],"was":[130],"performed":[131],"on":[132],"XC7V2000T":[133],"chip":[134],"prototype":[136],"verification,":[137],"can":[139],"integrate":[140],"up":[141],"to":[142],"1080":[143],"processing":[144,150,170],"elements.":[145],"After":[146],"testing,":[147],"when":[148],"elements":[151],"number":[152,172],"256,":[154],"peak":[156],"19.2":[159],"Gbit/s,":[160],"1k-order":[164],"matrix,":[165],"compared":[166],"with":[167],"same":[169,185],"element":[171],"structure,":[175],"our":[176],"compressed":[178],"1k":[179],"times":[180],"achieved":[183]},"counts_by_year":[{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
