{"id":"https://openalex.org/W4416542217","doi":"https://doi.org/10.48550/arxiv.2504.11903","title":"FedCanon: Non-Convex Composite Federated Learning with Efficient Proximal Operation on Heterogeneous Data","display_name":"FedCanon: Non-Convex Composite Federated Learning with Efficient Proximal Operation on Heterogeneous Data","publication_year":2025,"publication_date":"2025-04-16","ids":{"openalex":"https://openalex.org/W4416542217","doi":"https://doi.org/10.48550/arxiv.2504.11903"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2504.11903","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.11903","pdf_url":"https://arxiv.org/pdf/2504.11903","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2504.11903","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103870714","display_name":"Yuan Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhou, Yuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020894595","display_name":"Jiachen Zhong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhong, Jiachen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068429082","display_name":"Xinli Shi","orcid":"https://orcid.org/0000-0002-4443-608X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Xinli","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040088510","display_name":"Guanghui Wen","orcid":"https://orcid.org/0000-0003-0070-8597"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Guanghui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5070195520","display_name":"Xinghuo Yu","orcid":"https://orcid.org/0000-0001-8093-9787"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Xinghuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5103870714"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.8539999723434448,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.8539999723434448,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.060100000351667404,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.015399999916553497,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sublinear-function","display_name":"Sublinear function","score":0.5418999791145325},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.5170000195503235},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.49239999055862427},{"id":"https://openalex.org/keywords/rate-of-convergence","display_name":"Rate of convergence","score":0.48989999294281006},{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.46810001134872437},{"id":"https://openalex.org/keywords/decoupling","display_name":"Decoupling (probability)","score":0.41110000014305115},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.3921000063419342}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7850000262260437},{"id":"https://openalex.org/C117160843","wikidata":"https://www.wikidata.org/wiki/Q338652","display_name":"Sublinear function","level":2,"score":0.5418999791145325},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.5170000195503235},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.49239999055862427},{"id":"https://openalex.org/C57869625","wikidata":"https://www.wikidata.org/wiki/Q1783502","display_name":"Rate of convergence","level":3,"score":0.48989999294281006},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.46810001134872437},{"id":"https://openalex.org/C205606062","wikidata":"https://www.wikidata.org/wiki/Q5249645","display_name":"Decoupling (probability)","level":2,"score":0.41110000014305115},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4018999934196472},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.3921000063419342},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.3433000147342682},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.34299999475479126},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.32919999957084656},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3122999966144562},{"id":"https://openalex.org/C11210021","wikidata":"https://www.wikidata.org/wiki/Q1520713","display_name":"Linearization","level":3,"score":0.30720001459121704},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28220000863075256},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2797999978065491},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.2775000035762787},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.27239999175071716},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.26829999685287476},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.26170000433921814},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.2538999915122986},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.25369998812675476}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2504.11903","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.11903","pdf_url":"https://arxiv.org/pdf/2504.11903","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2504.11903","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2504.11903","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2504.11903","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.11903","pdf_url":"https://arxiv.org/pdf/2504.11903","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4416542217.pdf","grobid_xml":"https://content.openalex.org/works/W4416542217.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Composite":[0],"federated":[1,50],"learning":[2,10,51],"offers":[3],"a":[4,47,62,68,85,151,156],"general":[5,143],"framework":[6,140],"for":[7,137],"solving":[8],"machine":[9],"problems":[11,60],"with":[12],"additional":[13],"regularization":[14,73],"terms.":[15],"However,":[16],"existing":[17],"methods":[18,177],"often":[19],"face":[20],"significant":[21],"limitations:":[22],"many":[23],"require":[24],"clients":[25],"to":[26,38,56,109],"perform":[27],"computationally":[28],"expensive":[29],"proximal":[30,77,87,98],"operations,":[31],"and":[32,67,155,183],"their":[33],"performance":[34],"is":[35],"frequently":[36],"vulnerable":[37],"data":[39,116,189],"heterogeneity.":[40,117],"To":[41],"overcome":[42],"these":[43],"challenges,":[44],"we":[45],"propose":[46],"novel":[48],"composite":[49],"algorithm":[52],"called":[53],"\\textbf{FedCanon},":[54],"designed":[55],"solve":[57],"the":[58,90,96,111,122,132,142,160,164,175],"optimization":[59],"comprising":[61],"possibly":[63],"non-convex":[64,144],"loss":[65],"function":[66],"weakly":[69],"convex,":[70],"potentially":[71],"non-smooth":[72],"term.":[74],"By":[75],"decoupling":[76],"mappings":[78],"from":[79,115],"local":[80,107],"updates,":[81],"FedCanon":[82,149,173],"requires":[83],"only":[84],"single":[86],"evaluation":[88],"on":[89],"server":[91],"per":[92],"iteration,":[93],"thereby":[94],"reducing":[95],"overall":[97],"computation":[99],"cost.":[100],"Concurrently,":[101],"it":[102],"integrates":[103],"control":[104],"variables":[105],"into":[106],"updates":[108],"mitigate":[110],"client":[112],"drift":[113],"arising":[114],"The":[118,128],"entire":[119],"architecture":[120],"avoids":[121],"complex":[123],"subproblems":[124],"of":[125,180],"primal-dual":[126],"alternatives.":[127],"theoretical":[129],"analysis":[130],"provides":[131],"first":[133],"rigorous":[134],"convergence":[135,153],"guarantees":[136],"this":[138],"proximal-skipping":[139],"in":[141,178],"setting.":[145],"It":[146],"establishes":[147],"that":[148,172],"achieves":[150],"sublinear":[152],"rate,":[154],"linear":[157],"rate":[158],"under":[159,187],"Polyak-\u0141ojasiewicz":[161],"condition,":[162],"without":[163],"restrictive":[165],"bounded":[166],"heterogeneity":[167],"assumption.":[168],"Extensive":[169],"experiments":[170],"demonstrate":[171],"outperforms":[174],"state-of-the-art":[176],"terms":[179],"both":[181],"accuracy":[182],"computational":[184],"efficiency,":[185],"particularly":[186],"heterogeneous":[188],"distributions.":[190]},"counts_by_year":[],"updated_date":"2026-05-02T08:42:23.175194","created_date":"2025-10-10T00:00:00"}
