{"id":"https://openalex.org/W7084129775","doi":"https://doi.org/10.1109/infocom55648.2025.11044558","title":"\u03b3-FedHT: Stepsize-Aware Hard-Threshold Gradient Compression in Federated Learning","display_name":"\u03b3-FedHT: Stepsize-Aware Hard-Threshold Gradient Compression in Federated Learning","publication_year":2025,"publication_date":"2025-05-19","ids":{"openalex":"https://openalex.org/W7084129775","doi":"https://doi.org/10.1109/infocom55648.2025.11044558"},"language":"en","primary_location":{"id":"doi:10.1109/infocom55648.2025.11044558","is_oa":false,"landing_page_url":"https://doi.org/10.1109/infocom55648.2025.11044558","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE INFOCOM 2025 - IEEE Conference on Computer Communications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Rongwei Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Rongwei Lu","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School, Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yutong Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yutong Jiang","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School, Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jinrui Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinrui Zhang","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School, Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Chunyang Li","orcid":null},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunyang Li","raw_affiliation_strings":["Harbin Institute of Technology,Shenzhen"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology,Shenzhen","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yifei Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yifei Zhu","raw_affiliation_strings":["UM-SJTU Joint Institute, Shanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"UM-SJTU Joint Institute, Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Bin Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Chen","raw_affiliation_strings":["Harbin Institute of Technology,Shenzhen"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology,Shenzhen","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"last","author":{"id":null,"display_name":"Zhi Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhi Wang","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School, Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.76936622,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T12157","display_name":"Geochemistry and Geologic Mapping","score":0.65829998254776,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12157","display_name":"Geochemistry and Geologic Mapping","score":0.65829998254776,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13067","display_name":"Geological Modeling and Analysis","score":0.024299999698996544,"subfield":{"id":"https://openalex.org/subfields/1906","display_name":"Geochemistry and Petrology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10271","display_name":"Seismic Imaging and Inversion Techniques","score":0.018799999728798866,"subfield":{"id":"https://openalex.org/subfields/1908","display_name":"Geophysics"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.636900007724762},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.5371000170707703},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5056999921798706},{"id":"https://openalex.org/keywords/compression-ratio","display_name":"Compression ratio","score":0.4909999966621399},{"id":"https://openalex.org/keywords/regular-polygon","display_name":"Regular polygon","score":0.45829999446868896},{"id":"https://openalex.org/keywords/data-compression-ratio","display_name":"Data compression ratio","score":0.4212000072002411},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.39149999618530273},{"id":"https://openalex.org/keywords/rate-of-convergence","display_name":"Rate of convergence","score":0.37389999628067017}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7249000072479248},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.636900007724762},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.5371000170707703},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.510699987411499},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5056999921798706},{"id":"https://openalex.org/C25797200","wikidata":"https://www.wikidata.org/wiki/Q828137","display_name":"Compression ratio","level":3,"score":0.4909999966621399},{"id":"https://openalex.org/C112680207","wikidata":"https://www.wikidata.org/wiki/Q714886","display_name":"Regular polygon","level":2,"score":0.45829999446868896},{"id":"https://openalex.org/C94835093","wikidata":"https://www.wikidata.org/wiki/Q3113333","display_name":"Data compression ratio","level":5,"score":0.4212000072002411},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.39149999618530273},{"id":"https://openalex.org/C57869625","wikidata":"https://www.wikidata.org/wiki/Q1783502","display_name":"Rate of convergence","level":3,"score":0.37389999628067017},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.34689998626708984},{"id":"https://openalex.org/C13481523","wikidata":"https://www.wikidata.org/wiki/Q412438","display_name":"Image compression","level":4,"score":0.3221000134944916},{"id":"https://openalex.org/C131097465","wikidata":"https://www.wikidata.org/wiki/Q178898","display_name":"Gas compressor","level":2,"score":0.3125},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.30329999327659607},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.2987000048160553},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.296999990940094},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28200000524520874},{"id":"https://openalex.org/C81081738","wikidata":"https://www.wikidata.org/wiki/Q55542","display_name":"Lossless compression","level":3,"score":0.2766000032424927},{"id":"https://openalex.org/C2992525071","wikidata":"https://www.wikidata.org/wiki/Q50818671","display_name":"Federated learning","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C145446738","wikidata":"https://www.wikidata.org/wiki/Q319913","display_name":"Convex function","level":3,"score":0.26440000534057617},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.2599000036716461},{"id":"https://openalex.org/C311688","wikidata":"https://www.wikidata.org/wiki/Q2393193","display_name":"Time complexity","level":2,"score":0.2522999942302704}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/infocom55648.2025.11044558","is_oa":false,"landing_page_url":"https://doi.org/10.1109/infocom55648.2025.11044558","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE INFOCOM 2025 - IEEE Conference on Computer Communications","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Gradient":[0],"compression":[1,68,99,104],"can":[2],"effectively":[3],"alleviate":[4],"communication":[5,215],"bottlenecks":[6],"in":[7,72],"Federated":[8],"Learning":[9],"(FL).":[10],"Contemporary":[11],"state-of-the-art":[12],"sparse":[13],"compressors,":[14],"such":[15],"as":[16,194],"Top-<tex":[17,210],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[18,27,31,63,83,132,166,174,182,188,201,211],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$k$</tex>,":[19],"exhibit":[20],"high":[21],"computational":[22],"complexity,":[23],"up":[24,206],"to":[25,57,61,105,108,123,140,207],"<tex":[26,30,62,82,131,165,173,181,187,200],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathcal{O}(d\\log_{2}k)$</tex>,":[28],"where":[29,74],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$d$</tex>":[32],"is":[33,54,85],"the":[34,59,66,75,80,94,98,102,117,145,157,169],"number":[35],"of":[36,101,149,160,172],"model":[37,88,118],"parameters.":[38],"The":[39,90],"hard-threshold":[40,67,103],"compressor,":[41],"which":[42],"simply":[43],"transmits":[44],"elements":[45],"with":[46,138],"absolute":[47],"values":[48],"higher":[49],"than":[50],"a":[51,134],"fixed":[52],"threshold,":[53],"thus":[55],"proposed":[56],"reduce":[58],"complexity":[60],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathcal{O}(d)$</tex>.":[64],"However,":[65],"causes":[69,97],"accuracy":[70,119,204],"degradation":[71],"FL,":[73],"datasets":[76],"are":[77],"non-IID":[78,219],"and":[79,96,186],"stepsize":[81,92],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\gamma$</tex>":[84],"decreasing":[86],"for":[87],"convergence.":[89,142],"decaying":[91],"reduces":[93],"updates":[95],"ratio":[100],"drop":[106],"rapidly":[107],"an":[109],"aggressive":[110],"ratio.":[111],"At":[112],"or":[113],"below":[114],"this":[115],"ratio,":[116],"has":[120,168],"been":[121],"observed":[122],"degrade":[124],"severely.":[125],"To":[126],"address":[127],"this,":[128],"we":[129,155],"propose":[130],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\gamma$</tex>-FedHT,":[133],"stepsize-aware":[135],"low-cost":[136],"compressor":[137],"Error-Feedback":[139],"guarantee":[141],"Given":[143],"that":[144,164,199],"traditional":[146],"theoretical":[147],"framework":[148],"FL":[150],"does":[151],"not":[152],"consider":[153],"Error-Feedback,":[154],"introduce":[156],"fundamental":[158],"conversation":[159],"Error-Feedback.":[161],"We":[162],"prove":[163],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\gamma$</tex>-FedHT":[167,202],"convergence":[170],"rate":[171],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathcal{O}\\left(\\frac{1}{T}\\right)(T$</tex>":[175],"representing":[176],"total":[177],"training":[178],"iterations)":[179],"under":[180,190,213],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mu$</tex>-strongly":[183],"convex":[184],"cases":[185],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathcal{O}\\left(\\frac{1}{\\sqrt{T}}\\right)$</tex>":[189],"non-convex":[191],"cases,":[192],"same":[193],"FedAVG.":[195],"Extensive":[196],"experiments":[197],"demonstrate":[198],"improves":[203],"by":[205],"7.42%":[208],"over":[209],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$k$</tex>":[212],"equal":[214],"traffic":[216],"on":[217],"various":[218],"image":[220],"datasets.":[221]},"counts_by_year":[],"updated_date":"2025-12-21T23:12:01.093139","created_date":"2025-10-10T00:00:00"}
