{"id":"https://openalex.org/W3094279629","doi":"https://doi.org/10.1145/3412815.3416891","title":"Toward Communication Efficient Adaptive Gradient Method","display_name":"Toward Communication Efficient Adaptive Gradient Method","publication_year":2020,"publication_date":"2020-10-15","ids":{"openalex":"https://openalex.org/W3094279629","doi":"https://doi.org/10.1145/3412815.3416891","mag":"3094279629"},"language":"en","primary_location":{"id":"doi:10.1145/3412815.3416891","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3412815.3416891","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2020 ACM-IMS on Foundations of Data Science Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049896980","display_name":"Xiangyi Chen","orcid":"https://orcid.org/0000-0001-5549-5336"},"institutions":[{"id":"https://openalex.org/I4210108985","display_name":"Bellevue Hospital Center","ror":"https://ror.org/01ky34z31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1283621791","https://openalex.org/I4210086933","https://openalex.org/I4210108985"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xiangyi Chen","raw_affiliation_strings":["Baidu Research, Bellevue, WA, USA"],"affiliations":[{"raw_affiliation_string":"Baidu Research, Bellevue, WA, USA","institution_ids":["https://openalex.org/I4210108985"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100781895","display_name":"Xiaoyun Li","orcid":"https://orcid.org/0000-0001-5730-2972"},"institutions":[{"id":"https://openalex.org/I4210108985","display_name":"Bellevue Hospital Center","ror":"https://ror.org/01ky34z31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1283621791","https://openalex.org/I4210086933","https://openalex.org/I4210108985"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaoyun Li","raw_affiliation_strings":["Baidu Research, Bellevue, WA, USA"],"affiliations":[{"raw_affiliation_string":"Baidu Research, Bellevue, WA, USA","institution_ids":["https://openalex.org/I4210108985"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100435527","display_name":"Ping Li","orcid":"https://orcid.org/0000-0002-5979-8868"},"institutions":[{"id":"https://openalex.org/I4210108985","display_name":"Bellevue Hospital Center","ror":"https://ror.org/01ky34z31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1283621791","https://openalex.org/I4210086933","https://openalex.org/I4210108985"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ping Li","raw_affiliation_strings":["Baidu Research, Bellevue, WA, USA"],"affiliations":[{"raw_affiliation_string":"Baidu Research, Bellevue, WA, USA","institution_ids":["https://openalex.org/I4210108985"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5049896980"],"corresponding_institution_ids":["https://openalex.org/I4210108985"],"apc_list":null,"apc_paid":null,"fwci":1.92,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.89002761,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"119","last_page":"128"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8543426990509033},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.8428744077682495},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5837100148200989},{"id":"https://openalex.org/keywords/distributed-learning","display_name":"Distributed learning","score":0.5731565356254578},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5480192303657532},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5226718783378601},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.4906970262527466},{"id":"https://openalex.org/keywords/backpropagation","display_name":"Backpropagation","score":0.4668577015399933},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4638383984565735},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.459223210811615},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4481297731399536},{"id":"https://openalex.org/keywords/adaptive-learning","display_name":"Adaptive learning","score":0.4358070194721222},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.41654467582702637},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.14506471157073975},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.10457700490951538},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.09710583090782166}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8543426990509033},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.8428744077682495},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5837100148200989},{"id":"https://openalex.org/C2779582901","wikidata":"https://www.wikidata.org/wiki/Q21013010","display_name":"Distributed learning","level":2,"score":0.5731565356254578},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5480192303657532},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5226718783378601},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.4906970262527466},{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.4668577015399933},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4638383984565735},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.459223210811615},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4481297731399536},{"id":"https://openalex.org/C125014702","wikidata":"https://www.wikidata.org/wiki/Q4680749","display_name":"Adaptive learning","level":2,"score":0.4358070194721222},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.41654467582702637},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.14506471157073975},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.10457700490951538},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.09710583090782166},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3412815.3416891","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3412815.3416891","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2020 ACM-IMS on Foundations of Data Science Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W6908809","https://openalex.org/W1522301498","https://openalex.org/W2021404082","https://openalex.org/W2060393849","https://openalex.org/W2138243089","https://openalex.org/W2146502635","https://openalex.org/W2541884796","https://openalex.org/W2560674852","https://openalex.org/W2605800822","https://openalex.org/W2606098075","https://openalex.org/W2617766261","https://openalex.org/W2626325961","https://openalex.org/W2744599870","https://openalex.org/W2766140019","https://openalex.org/W2769644379","https://openalex.org/W2774000609","https://openalex.org/W2776855315","https://openalex.org/W2803867449","https://openalex.org/W2804993962","https://openalex.org/W2886463271","https://openalex.org/W2886837499","https://openalex.org/W2886849295","https://openalex.org/W2907225497","https://openalex.org/W2912323147","https://openalex.org/W2944542720","https://openalex.org/W2945586457","https://openalex.org/W2945785363","https://openalex.org/W2946270031","https://openalex.org/W2946511237","https://openalex.org/W2950960796","https://openalex.org/W2951651062","https://openalex.org/W2963698657","https://openalex.org/W2975043678","https://openalex.org/W2978329087","https://openalex.org/W2991209658","https://openalex.org/W3010969086","https://openalex.org/W3012796061","https://openalex.org/W3048687543","https://openalex.org/W3102816259","https://openalex.org/W4247777826","https://openalex.org/W4310895557","https://openalex.org/W6684249991","https://openalex.org/W6754654111"],"related_works":["https://openalex.org/W2595172197","https://openalex.org/W2084856301","https://openalex.org/W2127970246","https://openalex.org/W2885125400","https://openalex.org/W1989889224","https://openalex.org/W4382618745","https://openalex.org/W1973775000","https://openalex.org/W2748922771","https://openalex.org/W1987128138","https://openalex.org/W2743976221"],"abstract_inverted_index":{"In":[0,137],"recent":[1],"years,":[2],"distributed":[3,39,62],"optimization":[4],"is":[5,41,77,135],"proven":[6,120],"to":[7,12,46,81,91],"be":[8],"an":[9,142],"effective":[10,121],"approach":[11],"accelerate":[13],"training":[14,36,40,53,63,112,123],"of":[15,31,35,52,85,103,128],"large":[16],"scale":[17],"machine":[18,54],"learning":[19,55,76,134],"models":[20,56],"such":[21],"as":[22,109],"deep":[23],"neural":[24,124],"networks.":[25],"With":[26],"the":[27,33,50,82,93,110,126,150,153],"increasing":[28],"computation":[29,45],"power":[30],"GPUs,":[32],"bottleneck":[34],"speed":[37],"in":[38,49,74,132],"gradually":[42],"shifting":[43],"from":[44],"communication.":[47],"Meanwhile,":[48],"hope":[51],"on":[57],"mobile":[58,86],"devices,":[59],"a":[60],"new":[61],"paradigm":[64],"called":[65],"\"federated":[66],"learning''":[67],"has":[68],"become":[69],"popular.":[70],"The":[71],"communication":[72,94,154],"time":[73],"federated":[75,100,133,157],"especially":[78],"important":[79],"due":[80],"low":[83],"bandwidth":[84],"devices.":[87],"While":[88,114],"various":[89],"approaches":[90],"improve":[92],"efficiency":[95,155],"have":[96,118],"been":[97,119],"proposed":[98],"for":[99,122,156],"learning,":[101],"most":[102],"them":[104],"are":[105],"designed":[106],"with":[107],"SGD":[108],"prototype":[111],"algorithm.":[113],"adaptive":[115,129,143],"gradient":[116,130,144],"methods":[117,131],"nets,":[125],"study":[127],"scarce.":[136],"this":[138],"paper,":[139],"we":[140],"propose":[141],"method":[145],"that":[146],"can":[147],"guarantee":[148],"both":[149],"convergence":[151],"and":[152],"learning.":[158]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
