{"id":"https://openalex.org/W4319348870","doi":"https://doi.org/10.1145/3580315","title":"Performance Implication of Tensor Irregularity and Optimization for Distributed Tensor Decomposition","display_name":"Performance Implication of Tensor Irregularity and Optimization for Distributed Tensor Decomposition","publication_year":2023,"publication_date":"2023-02-07","ids":{"openalex":"https://openalex.org/W4319348870","doi":"https://doi.org/10.1145/3580315"},"language":"en","primary_location":{"id":"doi:10.1145/3580315","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3580315","pdf_url":null,"source":{"id":"https://openalex.org/S2483380313","display_name":"ACM Transactions on Parallel Computing","issn_l":"2329-4949","issn":["2329-4949","2329-4957"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Parallel Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031204113","display_name":"Zheng Miao","orcid":"https://orcid.org/0000-0001-6084-2793"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zheng Miao","raw_affiliation_strings":["Hangzhou Dianzi University, China"],"affiliations":[{"raw_affiliation_string":"Hangzhou Dianzi University, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003772863","display_name":"Jon C. Calhoun","orcid":"https://orcid.org/0000-0001-7191-4422"},"institutions":[{"id":"https://openalex.org/I8078737","display_name":"Clemson University","ror":"https://ror.org/037s24f05","country_code":"US","type":"education","lineage":["https://openalex.org/I8078737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jon C. Calhoun","raw_affiliation_strings":["Clemson University, USA"],"affiliations":[{"raw_affiliation_string":"Clemson University, USA","institution_ids":["https://openalex.org/I8078737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035001911","display_name":"Rong Ge","orcid":"https://orcid.org/0000-0002-2218-3675"},"institutions":[{"id":"https://openalex.org/I8078737","display_name":"Clemson University","ror":"https://ror.org/037s24f05","country_code":"US","type":"education","lineage":["https://openalex.org/I8078737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rong Ge","raw_affiliation_strings":["Clemson University, USA"],"affiliations":[{"raw_affiliation_string":"Clemson University, USA","institution_ids":["https://openalex.org/I8078737"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100454305","display_name":"Jiajia Li","orcid":"https://orcid.org/0000-0003-1270-4147"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiajia Li","raw_affiliation_strings":["North Carolina State University, USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, USA","institution_ids":["https://openalex.org/I137902535"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5031204113"],"corresponding_institution_ids":["https://openalex.org/I50760025"],"apc_list":null,"apc_paid":null,"fwci":0.217,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.35024155,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"10","issue":"2","first_page":"1","last_page":"27"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11304","display_name":"Advanced Neuroimaging Techniques and Applications","score":0.9652000069618225,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.958899974822998,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.8094854950904846},{"id":"https://openalex.org/keywords/tensor","display_name":"Tensor (intrinsic definition)","score":0.772381603717804},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7132800817489624},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.6802404522895813},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.5181690454483032},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.47002625465393066},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.4685657322406769},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.4258388578891754},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.42392072081565857},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.41741642355918884},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.41208600997924805},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3823997676372528},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.33543673157691956},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.22861766815185547},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1772545874118805}],"concepts":[{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.8094854950904846},{"id":"https://openalex.org/C155281189","wikidata":"https://www.wikidata.org/wiki/Q3518150","display_name":"Tensor (intrinsic definition)","level":2,"score":0.772381603717804},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7132800817489624},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.6802404522895813},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.5181690454483032},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.47002625465393066},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.4685657322406769},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4258388578891754},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.42392072081565857},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.41741642355918884},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.41208600997924805},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3823997676372528},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.33543673157691956},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.22861766815185547},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1772545874118805},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3580315","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3580315","pdf_url":null,"source":{"id":"https://openalex.org/S2483380313","display_name":"ACM Transactions on Parallel Computing","issn_l":"2329-4949","issn":["2329-4949","2329-4957"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Parallel Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5022414008","display_name":null,"funder_award_id":"SHF-1910197, SHF-1943114, CCF-155151, and OAC-2204011","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W111803032","https://openalex.org/W1574504252","https://openalex.org/W1798945469","https://openalex.org/W1825959699","https://openalex.org/W1963826206","https://openalex.org/W1969116741","https://openalex.org/W2024165284","https://openalex.org/W2056999868","https://openalex.org/W2079487069","https://openalex.org/W2103392911","https://openalex.org/W2105724942","https://openalex.org/W2131613942","https://openalex.org/W2138388932","https://openalex.org/W2246859513","https://openalex.org/W2559655401","https://openalex.org/W2565436413","https://openalex.org/W2604652149","https://openalex.org/W2616934551","https://openalex.org/W2768445292","https://openalex.org/W2788854599","https://openalex.org/W2805781225","https://openalex.org/W2885990458","https://openalex.org/W2886539428","https://openalex.org/W2902783593","https://openalex.org/W2911694715","https://openalex.org/W2924040443","https://openalex.org/W2964051974","https://openalex.org/W2986686333","https://openalex.org/W2991157588","https://openalex.org/W3002017272","https://openalex.org/W3047192504","https://openalex.org/W3099762987","https://openalex.org/W3131137184","https://openalex.org/W3164929383","https://openalex.org/W4239025233","https://openalex.org/W6638060716"],"related_works":["https://openalex.org/W3152165845","https://openalex.org/W1654043760","https://openalex.org/W2569661359","https://openalex.org/W2950186459","https://openalex.org/W2170114491","https://openalex.org/W2897298721","https://openalex.org/W2242624680","https://openalex.org/W2136127937","https://openalex.org/W4290987221","https://openalex.org/W2216309014"],"abstract_inverted_index":{"Tensors":[0],"are":[1,15],"used":[2],"by":[3,318],"a":[4,16,49,198,212],"wide":[5],"variety":[6],"of":[7,18,30,66,84,89,93,164,173,176,197,222,355],"applications":[8,32],"to":[9,142,190,249,320],"represent":[10],"multi-dimensional":[11],"data;":[12],"tensor":[13,52,140,200,335],"decompositions":[14],"class":[17],"methods":[19],"for":[20,54,68,106,123,146,230,353],"latent":[21,56],"data":[22,24],"analytics,":[23],"compression,":[25],"and":[26,40,63,82,91,113,121,155,168,178,180,183,185,194,211,246,273,286,288,310,314,323,345,349],"so":[27],"on.":[28],"Many":[29],"these":[31],"generate":[33],"large":[34,69],"tensors":[35,70,85,107,125],"with":[36,108,257,265],"irregular":[37,124,147,231],"dimension":[38,111,209],"sizes":[39,112,210],"nonzero":[41,114,214],"distribution.":[42,215],"CANDECOMP/PARAFAC":[43],"decomposition":[44,53],"(":[45],"Cpd":[46,67,105,166,241,306],")":[47],"is":[48,170,201,307],"popular":[50],"low-rank":[51],"discovering":[55],"features.":[57],"The":[58,80,297],"increasing":[59],"overhead":[60,130],"on":[61,138,204,218,326],"memory":[62,73,95],"execution":[64],"time":[65,129,259],"requires":[71],"distributed":[72,94,240,305,316],"implementations":[74,317],"as":[75,338],"the":[76,87,161,171,244,251,263,269,278,281,289,293,312],"only":[77],"feasible":[78],"solution.":[79],"sparsity":[81,184,245],"irregularity":[83,186,247],"hinder":[86],"improvement":[88],"performance":[90,120,167],"scalability":[92,122,169,352],"implementations.":[96],"While":[97],"previous":[98],"works":[99],"have":[100],"been":[101],"proved":[102],"successful":[103],"in":[104,131],"relatively":[109],"regular":[110],"distribution,":[115],"they":[116],"either":[117],"deliver":[118],"unsatisfactory":[119],"or":[126],"require":[127],"significant":[128],"preprocessing.":[132],"In":[133],"this":[134],"work,":[135],"we":[136,237],"focus":[137],"medium-grained":[139],"distribution":[141,275],"address":[143,234],"their":[144,181,192],"limitation":[145],"tensors.":[148,232],"We":[149,158,261],"first":[150],"thoroughly":[151],"investigate":[152],"through":[153],"theoretical":[154],"experimental":[156,298],"analysis.":[157],"disclose":[159],"that":[160,242,301],"main":[162],"cause":[163],"poor":[165],"imbalance":[172,224],"multiple":[174],"types":[175],"computations":[177,285],"communications":[179],"tradeoffs;":[182],"make":[187],"it":[188],"challenging":[189],"achieve":[191],"balances":[193,294],"tradeoffs.":[195],"Irregularity":[196],"sparse":[199,334,340],"categorized":[202],"based":[203],"two":[205,266],"aspects:":[206],"very":[207],"different":[208,255,333],"non-uniform":[213],"Typically,":[216],"focusing":[217],"optimizing":[219],"one":[220],"type":[221],"load":[223],"causes":[225],"other":[226],"ones":[227],"more":[228,308],"severe":[229],"To":[233],"such":[235,337],"challenges,":[236],"propose":[238],"irregularity-aware":[239,304],"leverages":[243],"information":[248],"identify":[250],"best":[252],"tradeoff":[253],"between":[254],"imbalances":[256],"low":[258],"overhead.":[260],"materialize":[262],"idea":[264],"optimization":[267],"methods:":[268],"prediction-based":[270],"grid":[271],"configuration":[272],"matrix-oriented":[274],"policy,":[276],"where":[277],"former":[279],"forms":[280],"global":[282],"balance":[283],"among":[284,295],"communications,":[287],"latter":[290],"further":[291],"adjusts":[292],"computations.":[296],"results":[299],"show":[300],"our":[302],"proposed":[303],"scalable":[309],"outperforms":[311],"medium-":[313],"fine-grained":[315],"up":[319],"4.4":[321],"\u00d7":[322,325],"11.4":[324],"1,536":[327],"processors,":[328],"respectively.":[329],"Our":[330],"optimizations":[331],"support":[332],"formats,":[336],"compressed":[339],"fiber":[341],"(CSF),":[342],"coordinate":[343],"(COO),":[344],"Hierarchical":[346],"Coordinate":[347],"(HiCOO),":[348],"gain":[350],"good":[351],"all":[354],"them.":[356]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
