{"id":"https://openalex.org/W3202303936","doi":"https://doi.org/10.1145/3458744.3473352","title":"Support Convolution of CNN with Compression Sparse Matrix Multiplication Flow in TVM","display_name":"Support Convolution of CNN with Compression Sparse Matrix Multiplication Flow in TVM","publication_year":2021,"publication_date":"2021-08-09","ids":{"openalex":"https://openalex.org/W3202303936","doi":"https://doi.org/10.1145/3458744.3473352","mag":"3202303936"},"language":"en","primary_location":{"id":"doi:10.1145/3458744.3473352","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3458744.3473352","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"50th International Conference on Parallel Processing Workshop","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076915932","display_name":"Hui-Hsin Liao","orcid":"https://orcid.org/0000-0002-4674-9872"},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Hui-Hsin Liao","raw_affiliation_strings":["National Tsing Hua University, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Tsing Hua University, Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034885231","display_name":"Chao-Lin Lee","orcid":"https://orcid.org/0000-0002-4619-3843"},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chao-Lin Lee","raw_affiliation_strings":["National Tsing Hua University, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Tsing Hua University, Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038803698","display_name":"Jenq\u2010Kuen Lee","orcid":"https://orcid.org/0000-0001-9919-6258"},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Jenq-Kuen Lee","raw_affiliation_strings":["National Tsing Hua University, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Tsing Hua University, Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039469651","display_name":"Wei\u2010Chih Lai","orcid":"https://orcid.org/0000-0003-2703-8845"},"institutions":[{"id":"https://openalex.org/I4210148979","display_name":"MediaTek (Taiwan)","ror":"https://ror.org/05g9jck81","country_code":"TW","type":"company","lineage":["https://openalex.org/I4210148979"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Wei-Chih Lai","raw_affiliation_strings":["MediaTek Inc, Taiwan"],"affiliations":[{"raw_affiliation_string":"MediaTek Inc, Taiwan","institution_ids":["https://openalex.org/I4210148979"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072319470","display_name":"Ming-Yu Hung","orcid":null},"institutions":[{"id":"https://openalex.org/I4210148979","display_name":"MediaTek (Taiwan)","ror":"https://ror.org/05g9jck81","country_code":"TW","type":"company","lineage":["https://openalex.org/I4210148979"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Ming-Yu Hung","raw_affiliation_strings":["MediaTek Inc, Taiwan"],"affiliations":[{"raw_affiliation_string":"MediaTek Inc, Taiwan","institution_ids":["https://openalex.org/I4210148979"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009835723","display_name":"Chung-Wen Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210148979","display_name":"MediaTek (Taiwan)","ror":"https://ror.org/05g9jck81","country_code":"TW","type":"company","lineage":["https://openalex.org/I4210148979"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chung-Wen Huang","raw_affiliation_strings":["MediaTek Inc, Taiwan"],"affiliations":[{"raw_affiliation_string":"MediaTek Inc, Taiwan","institution_ids":["https://openalex.org/I4210148979"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5076915932"],"corresponding_institution_ids":["https://openalex.org/I25846049"],"apc_list":null,"apc_paid":null,"fwci":0.7685,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.73846405,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.794553279876709},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.7258611917495728},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.710637092590332},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.6143232583999634},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.5584389567375183},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5477511286735535},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.5420549511909485},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5294411182403564},{"id":"https://openalex.org/keywords/flow","display_name":"Flow (mathematics)","score":0.4986753463745117},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.48214027285575867},{"id":"https://openalex.org/keywords/multiplication","display_name":"Multiplication (music)","score":0.48016825318336487},{"id":"https://openalex.org/keywords/matrix-multiplication","display_name":"Matrix multiplication","score":0.4599100947380066},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.4498825669288635},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.44793522357940674},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4396994113922119},{"id":"https://openalex.org/keywords/edge-computing","display_name":"Edge computing","score":0.4242382049560547},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3557230830192566},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3495240807533264},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.346911758184433},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1015520989894867}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.794553279876709},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.7258611917495728},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.710637092590332},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.6143232583999634},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.5584389567375183},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5477511286735535},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.5420549511909485},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5294411182403564},{"id":"https://openalex.org/C38349280","wikidata":"https://www.wikidata.org/wiki/Q1434290","display_name":"Flow (mathematics)","level":2,"score":0.4986753463745117},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.48214027285575867},{"id":"https://openalex.org/C2780595030","wikidata":"https://www.wikidata.org/wiki/Q3860309","display_name":"Multiplication (music)","level":2,"score":0.48016825318336487},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.4599100947380066},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.4498825669288635},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.44793522357940674},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4396994113922119},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.4242382049560547},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3557230830192566},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3495240807533264},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.346911758184433},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1015520989894867},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.0},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3458744.3473352","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3458744.3473352","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"50th International Conference on Parallel Processing Workshop","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5899999737739563,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W1845051632","https://openalex.org/W2000545491","https://openalex.org/W2006295906","https://openalex.org/W2080353445","https://openalex.org/W2108598243","https://openalex.org/W2112984492","https://openalex.org/W2117539524","https://openalex.org/W2271840356","https://openalex.org/W2507318699","https://openalex.org/W2513419314","https://openalex.org/W2515385951","https://openalex.org/W2605739168","https://openalex.org/W2743200750","https://openalex.org/W2754249189","https://openalex.org/W2780077279","https://openalex.org/W2785856116","https://openalex.org/W2805566098","https://openalex.org/W2945098486","https://openalex.org/W2949245006","https://openalex.org/W2949650786","https://openalex.org/W2955301920","https://openalex.org/W2963343843","https://openalex.org/W2963751813","https://openalex.org/W2981972129","https://openalex.org/W2996874060","https://openalex.org/W3091174280","https://openalex.org/W3098220359","https://openalex.org/W3104849992","https://openalex.org/W3118608800"],"related_works":["https://openalex.org/W4322761281","https://openalex.org/W4238233472","https://openalex.org/W4313526662","https://openalex.org/W2293771254","https://openalex.org/W4312996489","https://openalex.org/W3111395152","https://openalex.org/W3106131444","https://openalex.org/W3216099748","https://openalex.org/W4205963435","https://openalex.org/W4221142455"],"abstract_inverted_index":{"Recently,":[0],"machine":[1],"learning":[2,49],"has":[3],"been":[4],"widely":[5],"adopted":[6],"in":[7,11,77,88,109,122],"various":[8],"scenarios,":[9],"especially":[10],"edge":[12,15],"devices.":[13],"These":[14],"devices,":[16,22],"such":[17],"as":[18],"smartphones":[19],"or":[20,59],"IoT":[21],"are":[23,56,114],"usually":[24],"powered":[25],"by":[26,140],"limited":[27],"batteries.":[28],"Therefore,":[29,91],"how":[30],"to":[31,62,98,166],"increase":[32],"performance":[33],"and":[34,144],"achieve":[35,156],"power":[36],"savings":[37],"become":[38],"one":[39,81],"of":[40,47,82,106],"the":[41,45,52,74,83,93,99,104,111,138,146,167],"critical":[42],"issues":[43],"during":[44],"development":[46],"deep":[48],"frameworks.":[50],"In":[51,68,133],"research":[53],"efforts,":[54],"there":[55],"numerous":[57],"optimizations":[58],"methodologies":[60],"developed":[61],"aim":[63],"at":[64],"improving":[65,92],"CNN":[66],"performance.":[67],"this":[69],"paper,":[70],"we":[71,136],"focus":[72],"on":[73,159],"convolution":[75,94,128],"layer":[76],"CNN,":[78],"which":[79,110,124],"is":[80],"most":[84],"computationally":[85],"demanding":[86],"operators":[87],"neural":[89],"networks.":[90],"will":[95],"contribute":[96],"significantly":[97],"entire":[100],"model.":[101,147],"We":[102,118],"find":[103],"opportunities":[105],"sparse":[107,127],"convolution,":[108],"certain":[112,142],"matrices":[113],"with":[115,130,161],"high":[116],"sparsity.":[117],"proposed":[119,150],"a":[120,126],"flow":[121,129],"TVM,":[123],"provides":[125],"weight":[131,143],"pruning.":[132],"our":[134,149],"flow,":[135,151],"maximize":[137],"sparsity":[139],"pruning":[141],"pertaining":[145],"With":[148],"TVM":[152],"model":[153],"runtime":[154],"could":[155],"11.42x":[157],"speedup":[158],"average":[160],"ImageNet":[162],"based":[163],"models":[164],"compared":[165],"original":[168],"flow.":[169]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
