{"id":"https://openalex.org/W7124840614","doi":"https://doi.org/10.1109/cloudcom67567.2025.11331331","title":"An All-Reduce Compatible Top-$K$ Compressor for Communication-Efficient Distributed Learning","display_name":"An All-Reduce Compatible Top-$K$ Compressor for Communication-Efficient Distributed Learning","publication_year":2025,"publication_date":"2025-11-14","ids":{"openalex":"https://openalex.org/W7124840614","doi":"https://doi.org/10.1109/cloudcom67567.2025.11331331"},"language":null,"primary_location":{"id":"doi:10.1109/cloudcom67567.2025.11331331","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cloudcom67567.2025.11331331","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 lEEE International Conference on Cloud Computing Technology and Science (CloudCom)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Chuyan Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chuyan Chen","raw_affiliation_strings":["Peking University Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123434389","display_name":"Chenyang Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenyang Ma","raw_affiliation_strings":["Peking University Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053039986","display_name":"Zhangxin Li","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhangxin Li","raw_affiliation_strings":["Peking University Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100308027","display_name":"Yutong He","orcid":"https://orcid.org/0009-0002-5078-6454"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yutong He","raw_affiliation_strings":["Peking University Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123411329","display_name":"Yanjie Dong","orcid":null},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanjie Dong","raw_affiliation_strings":["Shenzhen MSU-BIT University,Shenzhen,P. R. China"],"affiliations":[{"raw_affiliation_string":"Shenzhen MSU-BIT University,Shenzhen,P. R. China","institution_ids":["https://openalex.org/I4210152380","https://openalex.org/I180726961"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5123381169","display_name":"Kun Yuan","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kun Yuan","raw_affiliation_strings":["Peking University Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.68861552,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.14830000698566437,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.14830000698566437,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.12370000034570694,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.09929999709129333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.7382000088691711},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6495000123977661},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6123999953269958},{"id":"https://openalex.org/keywords/gas-compressor","display_name":"Gas compressor","score":0.5705999732017517},{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.553600013256073},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.42329999804496765},{"id":"https://openalex.org/keywords/property","display_name":"Property (philosophy)","score":0.4146000146865845}],"concepts":[{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.7382000088691711},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7138000130653381},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6495000123977661},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6123999953269958},{"id":"https://openalex.org/C131097465","wikidata":"https://www.wikidata.org/wiki/Q178898","display_name":"Gas compressor","level":2,"score":0.5705999732017517},{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.553600013256073},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.42329999804496765},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.4146000146865845},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.40709999203681946},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.3747999966144562},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.35249999165534973},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.2946999967098236},{"id":"https://openalex.org/C163415756","wikidata":"https://www.wikidata.org/wiki/Q126473","display_name":"Contraction (grammar)","level":2,"score":0.2928999960422516},{"id":"https://openalex.org/C130120984","wikidata":"https://www.wikidata.org/wiki/Q2835898","display_name":"Distributed algorithm","level":2,"score":0.2761000096797943},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27300000190734863},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.2703999876976013},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2630999982357025},{"id":"https://openalex.org/C57869625","wikidata":"https://www.wikidata.org/wiki/Q1783502","display_name":"Rate of convergence","level":3,"score":0.2572000026702881},{"id":"https://openalex.org/C70061542","wikidata":"https://www.wikidata.org/wiki/Q989016","display_name":"Distributed database","level":2,"score":0.25609999895095825}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cloudcom67567.2025.11331331","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cloudcom67567.2025.11331331","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 lEEE International Conference on Cloud Computing Technology and Science (CloudCom)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W2041517243","https://openalex.org/W2194775991","https://openalex.org/W2407022425","https://openalex.org/W2416799949","https://openalex.org/W2568772110","https://openalex.org/W2950865323","https://openalex.org/W2965373594","https://openalex.org/W2995022099","https://openalex.org/W4387544248","https://openalex.org/W4408182971"],"related_works":[],"abstract_inverted_index":{"Communication":[0],"remains":[1],"a":[2,16,73],"central":[3],"bottleneck":[4],"in":[5,37],"large-scale":[6],"distributed":[7],"machine":[8],"learning,":[9],"and":[10,34,51,105,135],"gradient":[11,25],"sparsi-fication":[12],"has":[13],"emerged":[14],"as":[15],"promising":[17],"strategy":[18],"to":[19,130],"alleviate":[20],"this":[21,57],"challenge.":[22],"However,":[23],"existing":[24],"compressors":[26],"face":[27],"notable":[28],"limitations:":[29],"Rand-K":[30,143],"discards":[31],"structural":[32],"information":[33],"per-forms":[35],"poorly":[36],"practice,":[38],"while":[39,82,123],"Top-<tex":[40,149],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[41,89,150],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$K$</tex>":[42,90],"preserves":[43],"informative":[44],"entries":[45],"but":[46],"loses":[47],"the":[48,77,110,119,140,145],"contraction":[49],"property":[50],"requires":[52],"costly":[53],"All-Gather":[54],"operations.":[55],"In":[56],"paper,":[58],"we":[59],"propose":[60],"ARC-Top-K,":[61],"an":[62,133],"All-Reduce-Compatible":[63],"Top-K":[64,122],"compressor":[65],"that":[66,138],"aligns":[67],"sparsity":[68],"patterns":[69],"across":[70],"nodes":[71],"using":[72],"lightweight":[74],"sketch":[75],"of":[76,121,142,148],"gradient,":[78],"enabling":[79],"index-free":[80],"All-Reduce":[81],"preserving":[83],"globally":[84],"significant":[85],"information.":[86],"ARC-Top-":[87],"<tex":[88],"is":[91],"provably":[92],"con-tractive":[93],"and,":[94],"when":[95],"combined":[96],"with":[97,144],"momentum":[98],"error":[99],"feedback":[100],"(EF21M),":[101],"achieves":[102],"linear":[103],"speedup":[104],"sharper":[106],"convergence":[107],"rates":[108],"than":[109],"original":[111],"EF21M":[112],"under":[113],"standard":[114],"assumptions.":[115],"Empirically,":[116],"ARC-Top-K":[117],"matches":[118],"accuracy":[120],"reducing":[124],"wall-clock":[125],"training":[126],"time":[127],"by":[128],"up":[129],"60.7%,":[131],"offering":[132],"efficient":[134],"scalable":[136],"solution":[137],"combines":[139],"robustness":[141],"strong":[146],"performance":[147],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$K$</tex>.":[151]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2026-01-21T00:00:00"}
