{"id":"https://openalex.org/W7124872707","doi":"https://doi.org/10.1109/cloudcom67567.2025.11331531","title":"Greedy Low-Rank Gradient Compression Provably Converges for Distributed Learning","display_name":"Greedy Low-Rank Gradient Compression Provably Converges for Distributed Learning","publication_year":2025,"publication_date":"2025-11-14","ids":{"openalex":"https://openalex.org/W7124872707","doi":"https://doi.org/10.1109/cloudcom67567.2025.11331531"},"language":null,"primary_location":{"id":"doi:10.1109/cloudcom67567.2025.11331531","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cloudcom67567.2025.11331531","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 lEEE International Conference on Cloud Computing Technology and Science (CloudCom)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Chuyan Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chuyan Chen","raw_affiliation_strings":["Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100308027","display_name":"Yutong He","orcid":"https://orcid.org/0009-0002-5078-6454"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yutong He","raw_affiliation_strings":["Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100439832","display_name":"Pei Li","orcid":"https://orcid.org/0000-0001-8699-8825"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengrui Li","raw_affiliation_strings":["Beihang University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Beihang University,Beijing,China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123415370","display_name":"Weichen Jia","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weichen Jia","raw_affiliation_strings":["Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123408082","display_name":"Yanjie Dong","orcid":null},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]},{"id":"https://openalex.org/I4388482657","display_name":"Shenzhen MSU-BIT University","ror":"https://ror.org/02q963474","country_code":null,"type":"education","lineage":["https://openalex.org/I4388482657"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanjie Dong","raw_affiliation_strings":["Shenzhen MSU-BIT University,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen MSU-BIT University,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380","https://openalex.org/I4388482657"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5123381169","display_name":"Kun Yuan","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kun Yuan","raw_affiliation_strings":["Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":2.5513,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.93817279,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.4903999865055084,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.4903999865055084,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.4853000044822693,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.0032999999821186066,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/greedy-randomized-adaptive-search-procedure","display_name":"Greedy randomized adaptive search procedure","score":0.6485999822616577},{"id":"https://openalex.org/keywords/rate-of-convergence","display_name":"Rate of convergence","score":0.5968999862670898},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.585099995136261},{"id":"https://openalex.org/keywords/greedy-algorithm","display_name":"Greedy algorithm","score":0.5541999936103821},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.5192000269889832},{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.5171999931335449},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.46399998664855957},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.44999998807907104}],"concepts":[{"id":"https://openalex.org/C126221529","wikidata":"https://www.wikidata.org/wiki/Q3116070","display_name":"Greedy randomized adaptive search procedure","level":3,"score":0.6485999822616577},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6359999775886536},{"id":"https://openalex.org/C57869625","wikidata":"https://www.wikidata.org/wiki/Q1783502","display_name":"Rate of convergence","level":3,"score":0.5968999862670898},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.585099995136261},{"id":"https://openalex.org/C51823790","wikidata":"https://www.wikidata.org/wiki/Q504353","display_name":"Greedy algorithm","level":2,"score":0.5541999936103821},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.5192000269889832},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.5171999931335449},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.47130000591278076},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.46399998664855957},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.45570001006126404},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.44999998807907104},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.43220001459121704},{"id":"https://openalex.org/C130120984","wikidata":"https://www.wikidata.org/wiki/Q2835898","display_name":"Distributed algorithm","level":2,"score":0.3982999920845032},{"id":"https://openalex.org/C17020691","wikidata":"https://www.wikidata.org/wiki/Q139677","display_name":"Operator (biology)","level":5,"score":0.3970000147819519},{"id":"https://openalex.org/C124851039","wikidata":"https://www.wikidata.org/wiki/Q2665459","display_name":"Compressed sensing","level":2,"score":0.3677999973297119},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.3361999988555908},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.31859999895095825},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.31310001015663147},{"id":"https://openalex.org/C128669082","wikidata":"https://www.wikidata.org/wiki/Q583461","display_name":"Randomized algorithm","level":2,"score":0.2955000102519989},{"id":"https://openalex.org/C115680565","wikidata":"https://www.wikidata.org/wiki/Q5977448","display_name":"Gradient method","level":2,"score":0.287200003862381}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cloudcom67567.2025.11331531","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cloudcom67567.2025.11331531","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 lEEE International Conference on Cloud Computing Technology and Science (CloudCom)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W1788292158","https://openalex.org/W2194775991","https://openalex.org/W2407022425","https://openalex.org/W2416799949","https://openalex.org/W2923014074","https://openalex.org/W2950865323","https://openalex.org/W4387544248","https://openalex.org/W4408182971"],"related_works":[],"abstract_inverted_index":{"Distributed":[0],"optimization":[1],"is":[2],"pivotal":[3],"for":[4,91,152],"large-scale":[5],"signal":[6],"processing":[7],"and":[8,59,109],"machine":[9],"learning,":[10],"yet":[11],"communication":[12],"overhead":[13],"remains":[14,120],"a":[15,35,111,133],"major":[16],"bottleneck.":[17],"Low-rank":[18],"gradient":[19,88,154],"com-pression,":[20],"in":[21],"which":[22],"the":[23,66,103,117,146],"transmitted":[24],"gradients":[25,51],"are":[26,158],"approximated":[27],"by":[28,106],"low-rank":[29,153],"matrices":[30],"to":[31,101,160],"reduce":[32],"communication,":[33],"offers":[34],"promising":[36],"remedy.":[37],"Existing":[38],"methods":[39,64],"typically":[40],"adopt":[41],"either":[42],"randomized":[43,48],"or":[44],"greedy":[45,63,107],"compression":[46,89,108],"strategies:":[47],"approaches":[49],"project":[50],"onto":[52],"randomly":[53],"chosen":[54],"subspaces,":[55,69],"introducing":[56],"high":[57],"variance":[58],"degrading":[60],"empirical":[61,72],"performance;":[62],"select":[65],"most":[67],"informative":[68],"achieving":[70],"strong":[71],"results":[73],"but":[74],"lacking":[75],"convergence":[76,95,134,150],"guarantees.":[77,96],"To":[78],"address":[79],"this":[80],"gap,":[81],"we":[82,128],"propose":[83],"GreedyLore-the":[84],"first":[85,147],"Greedy":[86],"Low-Rank":[87],"algorithm":[90],"distributedlearning":[92],"with":[93],"rigorous":[94],"GreedyLore":[97,131],"incorporates":[98],"error":[99],"feedback":[100],"correct":[102],"bias":[104],"introduced":[105],"introduces":[110],"semi-lazy":[112],"subspace":[113],"update":[114],"that":[115,130],"ensures":[116],"com-pression":[118],"operator":[119],"contractive":[121],"throughout":[122],"all":[123],"iterations.":[124],"With":[125],"these":[126],"techniques,":[127],"prove":[129],"achieves":[132],"rate":[135,151],"of":[136],"<tex":[137],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[138],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathcal{O}(\\sigma/\\sqrt{NT}^{-}+1/T)$</tex>":[139],"under":[140],"standard":[141],"optimizers":[142],"such":[143],"as":[144],"Adam-marking":[145],"linear":[148],"speedup":[149],"compression.":[155],"Extensive":[156],"experiments":[157],"conducted":[159],"validate":[161],"our":[162],"theoretical":[163],"findings.":[164]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2026-01-21T00:00:00"}
