{"id":"https://openalex.org/W4406794196","doi":"https://doi.org/10.1109/tc.2025.3533083","title":"Optimizing Structured-Sparse Matrix Multiplication in RISC-V Vector Processors","display_name":"Optimizing Structured-Sparse Matrix Multiplication in RISC-V Vector Processors","publication_year":2025,"publication_date":"2025-01-24","ids":{"openalex":"https://openalex.org/W4406794196","doi":"https://doi.org/10.1109/tc.2025.3533083"},"language":"en","primary_location":{"id":"doi:10.1109/tc.2025.3533083","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2025.3533083","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093264909","display_name":"Vasileios Titopoulos","orcid":"https://orcid.org/0009-0009-0123-5737"},"institutions":[{"id":"https://openalex.org/I147962203","display_name":"Democritus University of Thrace","ror":"https://ror.org/03bfqnx40","country_code":"GR","type":"education","lineage":["https://openalex.org/I147962203"]}],"countries":["GR"],"is_corresponding":true,"raw_author_name":"Vasileios Titopoulos","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Democritus University of Thrace, Xanthi, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Democritus University of Thrace, Xanthi, Greece","institution_ids":["https://openalex.org/I147962203"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111262390","display_name":"Kosmas Alexandridis","orcid":null},"institutions":[{"id":"https://openalex.org/I147962203","display_name":"Democritus University of Thrace","ror":"https://ror.org/03bfqnx40","country_code":"GR","type":"education","lineage":["https://openalex.org/I147962203"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Kosmas Alexandridis","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Democritus University of Thrace, Xanthi, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Democritus University of Thrace, Xanthi, Greece","institution_ids":["https://openalex.org/I147962203"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063756965","display_name":"Christodoulos Peltekis","orcid":"https://orcid.org/0009-0000-8930-9431"},"institutions":[{"id":"https://openalex.org/I147962203","display_name":"Democritus University of Thrace","ror":"https://ror.org/03bfqnx40","country_code":"GR","type":"education","lineage":["https://openalex.org/I147962203"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Christodoulos Peltekis","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Democritus University of Thrace, Xanthi, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Democritus University of Thrace, Xanthi, Greece","institution_ids":["https://openalex.org/I147962203"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035714231","display_name":"Chrysostomos Nicopoulos","orcid":"https://orcid.org/0000-0001-6389-6068"},"institutions":[{"id":"https://openalex.org/I34771391","display_name":"University of Cyprus","ror":"https://ror.org/02qjrjx09","country_code":"CY","type":"education","lineage":["https://openalex.org/I34771391"]}],"countries":["CY"],"is_corresponding":false,"raw_author_name":"Chrysostomos Nicopoulos","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Cyprus, Nicosia, Cyprus"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Cyprus, Nicosia, Cyprus","institution_ids":["https://openalex.org/I34771391"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074704256","display_name":"Giorgos Dimitrakopoulos","orcid":"https://orcid.org/0000-0003-3688-7865"},"institutions":[{"id":"https://openalex.org/I147962203","display_name":"Democritus University of Thrace","ror":"https://ror.org/03bfqnx40","country_code":"GR","type":"education","lineage":["https://openalex.org/I147962203"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Giorgos Dimitrakopoulos","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Democritus University of Thrace, Xanthi, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Democritus University of Thrace, Xanthi, Greece","institution_ids":["https://openalex.org/I147962203"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5093264909"],"corresponding_institution_ids":["https://openalex.org/I147962203"],"apc_list":null,"apc_paid":null,"fwci":7.7276,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.9664954,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"74","issue":"4","first_page":"1446","last_page":"1460"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.65265291929245},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6289190053939819},{"id":"https://openalex.org/keywords/matrix-multiplication","display_name":"Matrix multiplication","score":0.5994759798049927},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.5973746180534363},{"id":"https://openalex.org/keywords/multiplication","display_name":"Multiplication (music)","score":0.4962530732154846},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.40147513151168823},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3290014863014221},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2478400468826294},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.11804661154747009},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.09282946586608887}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.65265291929245},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6289190053939819},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.5994759798049927},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.5973746180534363},{"id":"https://openalex.org/C2780595030","wikidata":"https://www.wikidata.org/wiki/Q3860309","display_name":"Multiplication (music)","level":2,"score":0.4962530732154846},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.40147513151168823},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3290014863014221},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2478400468826294},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.11804661154747009},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.09282946586608887},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tc.2025.3533083","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2025.3533083","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W1973918431","https://openalex.org/W1981985132","https://openalex.org/W1985263109","https://openalex.org/W2007259720","https://openalex.org/W2089437293","https://openalex.org/W2147657366","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2412662927","https://openalex.org/W2613264175","https://openalex.org/W2912046679","https://openalex.org/W2963446712","https://openalex.org/W2980186997","https://openalex.org/W2994193159","https://openalex.org/W2997005340","https://openalex.org/W3016842236","https://openalex.org/W3042944763","https://openalex.org/W3103168911","https://openalex.org/W3158543914","https://openalex.org/W3185702163","https://openalex.org/W3194242682","https://openalex.org/W4247008581","https://openalex.org/W4308083915","https://openalex.org/W4311486595","https://openalex.org/W4311995762","https://openalex.org/W4367721918","https://openalex.org/W4385623132","https://openalex.org/W4386859355","https://openalex.org/W4388581352","https://openalex.org/W4389500474","https://openalex.org/W4399732797","https://openalex.org/W4402917213","https://openalex.org/W6770699648","https://openalex.org/W6779824479","https://openalex.org/W6789946416","https://openalex.org/W6790503700","https://openalex.org/W6794457956"],"related_works":["https://openalex.org/W3099313426","https://openalex.org/W4287593139","https://openalex.org/W2057797376","https://openalex.org/W2090319426","https://openalex.org/W752783541","https://openalex.org/W2506252583","https://openalex.org/W1506547947","https://openalex.org/W4406620725","https://openalex.org/W2048249848","https://openalex.org/W2995605830"],"abstract_inverted_index":{"Structured":[0],"sparsity":[1,62],"has":[2],"been":[3],"proposed":[4,143,185],"as":[5,97],"an":[6],"efficient":[7],"way":[8],"to":[9,19,56,66],"prune":[10],"the":[11,21,58,69,74,81,98,104,113,129,159,166,203,207,211,215,219,228,249],"complexity":[12],"of":[13,23,60,76,100,115,131,168,221,230],"Machine":[14],"Learning":[15],"(ML)":[16],"applications":[17],"and":[18,106,112,122,163,206,214,238],"simplify":[20],"handling":[22],"sparse":[24],"data":[25,101,110],"in":[26,190],"hardware.":[27],"Accelerating":[28],"ML":[29],"models,":[30],"whether":[31],"for":[32,155,218],"training,":[33],"or":[34,49],"inference,":[35],"heavily":[36],"relies":[37],"on":[38,46],"matrix":[39,51,71,78,172],"multiplications":[40],"that":[41,93,128,179,246],"can":[42],"be":[43],"efficiently":[44],"executed":[45,170],"vector":[47,64,86,107,151,160,194],"processors,":[48],"custom":[50,232],"engines.":[52],"This":[53],"work":[54],"aims":[55],"integrate":[57],"simplicity":[59],"structured":[61],"into":[63],"execution":[65,220],"speed":[67],"up":[68],"corresponding":[70],"multiplications.":[72],"Initially,":[73],"implementation":[75],"structured-sparse":[77],"multiplication":[79,173],"using":[80],"current":[82],"RISC-V":[83,193,252],"instruction":[84,135,144,187,217,233],"set":[85],"extension":[87],"is":[88,126,145],"comprehensively":[89],"explored.":[90],"Critical":[91],"parameters":[92],"affect":[94],"performance,":[95],"such":[96],"impact":[99],"distribution":[102],"across":[103],"scalar":[105],"register":[108,161],"files,":[109],"locality,":[111],"effectiveness":[114],"loop":[116,182],"unrolling":[117],"are":[118],"analyzed":[119],"both":[120],"qualitatively":[121],"quantitatively.":[123],"Furthermore,":[124],"it":[125,164],"demonstrated":[127],"addition":[130,229],"a":[132,191,231],"single":[133],"new":[134,186,216],"would":[136,180],"reap":[137],"even":[138],"higher":[139],"performance.":[140],"The":[141,184],"newly":[142],"called":[146],"<monospace":[147],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[148],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">vindexmac</monospace>,":[149],"i.e.,":[150],"index-multiply-accumulate.":[152],"It":[153],"allows":[154],"indirect":[156],"reads":[157],"from":[158],"file":[162],"reduces":[165],"number":[167],"instructions":[169],"per":[171],"iteration,":[174],"without":[175],"introducing":[176],"additional":[177],"dependencies":[178],"limit":[181],"unrolling.":[183],"was":[188],"integrated":[189],"decoupled":[192],"processor":[195],"with":[196,242],"negligible":[197],"hardware":[198],"cost.":[199],"Experimental":[200],"results":[201],"demonstrate":[202],"runtime":[204,235],"efficiency":[205],"scalability":[208],"offered":[209],"by":[210,236],"introduced":[212],"optimizations":[213],"state-of-the-art":[222],"Convolutional":[223],"Neural":[224],"Networks.":[225],"More":[226],"particularly,":[227],"improves":[234],"25%":[237],"33%,":[239],"when":[240],"compared":[241],"highly-optimized":[243],"vectorized":[244],"kernels":[245],"use":[247],"only":[248],"currently":[250],"defined":[251],"instructions.":[253]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":3}],"updated_date":"2026-02-25T23:00:34.991745","created_date":"2025-10-10T00:00:00"}
