{"id":"https://openalex.org/W4292862735","doi":"https://doi.org/10.1109/mwscas54063.2022.9859440","title":"Hardware Acceleration in Large-Scale Tensor Decomposition for Neural Network Compression","display_name":"Hardware Acceleration in Large-Scale Tensor Decomposition for Neural Network Compression","publication_year":2022,"publication_date":"2022-08-07","ids":{"openalex":"https://openalex.org/W4292862735","doi":"https://doi.org/10.1109/mwscas54063.2022.9859440"},"language":"en","primary_location":{"id":"doi:10.1109/mwscas54063.2022.9859440","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mwscas54063.2022.9859440","pdf_url":null,"source":{"id":"https://openalex.org/S4363606568","display_name":"2022 IEEE 65th International Midwest Symposium on Circuits and Systems (MWSCAS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE 65th International Midwest Symposium on Circuits and Systems (MWSCAS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110739049","display_name":"C.-L. Kao","orcid":null},"institutions":[{"id":"https://openalex.org/I16733864","display_name":"National Taiwan University","ror":"https://ror.org/05bqach95","country_code":"TW","type":"education","lineage":["https://openalex.org/I16733864"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chen-Chien Kao","raw_affiliation_strings":["National Taiwan University,Graduate Institute of Electronics Engineering,Taipei,Taiwan","Graduate Institute of Electronics Engineering, National Taiwan University, Taipei, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taiwan University,Graduate Institute of Electronics Engineering,Taipei,Taiwan","institution_ids":["https://openalex.org/I16733864"]},{"raw_affiliation_string":"Graduate Institute of Electronics Engineering, National Taiwan University, Taipei, Taiwan","institution_ids":["https://openalex.org/I16733864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043326737","display_name":"Yi-Yen Hsieh","orcid":"https://orcid.org/0000-0002-4481-5848"},"institutions":[{"id":"https://openalex.org/I16733864","display_name":"National Taiwan University","ror":"https://ror.org/05bqach95","country_code":"TW","type":"education","lineage":["https://openalex.org/I16733864"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yi-Yen Hsieh","raw_affiliation_strings":["National Taiwan University,Graduate Institute of Electronics Engineering,Taipei,Taiwan","Graduate Institute of Electronics Engineering, National Taiwan University, Taipei, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taiwan University,Graduate Institute of Electronics Engineering,Taipei,Taiwan","institution_ids":["https://openalex.org/I16733864"]},{"raw_affiliation_string":"Graduate Institute of Electronics Engineering, National Taiwan University, Taipei, Taiwan","institution_ids":["https://openalex.org/I16733864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102176313","display_name":"Chao-Hung Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210148468","display_name":"Industrial Technology Research Institute","ror":"https://ror.org/05szzwt63","country_code":"TW","type":"nonprofit","lineage":["https://openalex.org/I4210148468"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chao-Hung Chen","raw_affiliation_strings":["Industrial Technology Research Institute,Hsinchu,Taiwan","Industrial Technology Research Institute, Hsinchu, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Industrial Technology Research Institute,Hsinchu,Taiwan","institution_ids":["https://openalex.org/I4210148468"]},{"raw_affiliation_string":"Industrial Technology Research Institute, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I4210148468"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101750729","display_name":"Chia\u2010Hsiang Yang","orcid":"https://orcid.org/0000-0003-1163-321X"},"institutions":[{"id":"https://openalex.org/I16733864","display_name":"National Taiwan University","ror":"https://ror.org/05bqach95","country_code":"TW","type":"education","lineage":["https://openalex.org/I16733864"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chia-Hsiang Yang","raw_affiliation_strings":["National Taiwan University,Graduate Institute of Electronics Engineering,Taipei,Taiwan","Graduate Institute of Electronics Engineering, National Taiwan University, Taipei, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taiwan University,Graduate Institute of Electronics Engineering,Taipei,Taiwan","institution_ids":["https://openalex.org/I16733864"]},{"raw_affiliation_string":"Graduate Institute of Electronics Engineering, National Taiwan University, Taipei, Taiwan","institution_ids":["https://openalex.org/I16733864"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.08695652,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.920799970626831,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/tensor","display_name":"Tensor (intrinsic definition)","score":0.5997294187545776},{"id":"https://openalex.org/keywords/hadamard-transform","display_name":"Hadamard transform","score":0.5905527472496033},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5585517883300781},{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.5209521055221558},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.49739912152290344},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4941735565662384},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.4718475341796875},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.46768811345100403},{"id":"https://openalex.org/keywords/discrete-cosine-transform","display_name":"Discrete cosine transform","score":0.4457802176475525},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.438557893037796},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3912971615791321},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3046201467514038},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.16786974668502808},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.15894818305969238},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.13879325985908508},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.12219232320785522},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.09618830680847168},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.08363229036331177}],"concepts":[{"id":"https://openalex.org/C155281189","wikidata":"https://www.wikidata.org/wiki/Q3518150","display_name":"Tensor (intrinsic definition)","level":2,"score":0.5997294187545776},{"id":"https://openalex.org/C60292330","wikidata":"https://www.wikidata.org/wiki/Q1014065","display_name":"Hadamard transform","level":2,"score":0.5905527472496033},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5585517883300781},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.5209521055221558},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.49739912152290344},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4941735565662384},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4718475341796875},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.46768811345100403},{"id":"https://openalex.org/C2221639","wikidata":"https://www.wikidata.org/wiki/Q2877","display_name":"Discrete cosine transform","level":3,"score":0.4457802176475525},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.438557893037796},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3912971615791321},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3046201467514038},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.16786974668502808},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.15894818305969238},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.13879325985908508},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.12219232320785522},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.09618830680847168},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.08363229036331177}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mwscas54063.2022.9859440","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mwscas54063.2022.9859440","pdf_url":null,"source":{"id":"https://openalex.org/S4363606568","display_name":"2022 IEEE 65th International Midwest Symposium on Circuits and Systems (MWSCAS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE 65th International Midwest Symposium on Circuits and Systems (MWSCAS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.8899999856948853,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320309618","display_name":"Ministry of Science and Technology","ror":"https://ror.org/02b207r52"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W2024165284","https://openalex.org/W2025603201","https://openalex.org/W2047680880","https://openalex.org/W2469230926","https://openalex.org/W2475965870","https://openalex.org/W2582365613","https://openalex.org/W2963048316","https://openalex.org/W3095508601","https://openalex.org/W3102869303","https://openalex.org/W3171753205","https://openalex.org/W4220761057","https://openalex.org/W6679667936"],"related_works":["https://openalex.org/W1916685473","https://openalex.org/W2055682261","https://openalex.org/W1993363272","https://openalex.org/W2186390138","https://openalex.org/W2060035984","https://openalex.org/W2790129917","https://openalex.org/W1982241170","https://openalex.org/W2992856432","https://openalex.org/W2116282083","https://openalex.org/W2100638064"],"abstract_inverted_index":{"A":[0,63],"tensor":[1,20,27,114,133],"is":[2,7,75,110],"a":[3,18,30,117,142],"multi-dimensional":[4],"array,":[5],"which":[6],"embedded":[8],"for":[9,59,90,97,132],"neural":[10,60],"networks.":[11],"The":[12,107],"multiply-accumulate":[13],"(MAC)":[14],"operations":[15],"involved":[16],"in":[17,56],"large-scale":[19,57],"introduces":[21],"high":[22],"computational":[23,34],"complexity.":[24],"Since":[25],"the":[26,33,68,79,88,99,128,147],"usually":[28],"features":[29],"low":[31],"rank,":[32],"complexity":[35],"can":[36],"be":[37],"largely":[38],"reduced":[39],"through":[40],"canonical":[41],"polyadic":[42],"decomposition":[43,115],"(CPD).":[44],"This":[45],"work":[46,136],"presents":[47],"an":[48],"energy-efficient":[49],"hardware":[50],"accelerator":[51,109],"that":[52,66],"implements":[53],"randomized":[54],"CPD":[55],"tensors":[58,139],"network":[61],"compression.":[62],"mixing":[64],"method":[65],"combines":[67],"Walsh-Hadamard":[69],"transform":[70,74,82],"and":[71,140],"discrete":[72],"cosine":[73],"proposed":[76,108],"to":[77,112,121,127],"replace":[78],"fast":[80],"Fourier":[81],"with":[83,116],"faster":[84],"convergence.":[85],"It":[86],"reduces":[87],"computations":[89,96],"transformation":[91],"by":[92],"83%.":[93],"75%":[94],"of":[95,119],"solving":[98],"required":[100],"least":[101],"squares":[102],"problem":[103],"are":[104],"also":[105],"reduced.":[106],"flexible":[111],"support":[113,137],"size":[118],"up":[120],"$512\\times":[122],"512\\times":[123],"9\\times":[124],"9$.":[125],"Compared":[126],"prior":[129],"dedicated":[130],"processor":[131],"computation,":[134],"this":[135],"larger":[138],"achieves":[141],"$112\\times$":[143],"lower":[144],"latency":[145],"given":[146],"same":[148],"condition.":[149]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
