{"id":"https://openalex.org/W2948092338","doi":"https://doi.org/10.1109/jsait.2020.2985917","title":"Qsparse-Local-SGD: Distributed SGD With Quantization, Sparsification, and Local Computations","display_name":"Qsparse-Local-SGD: Distributed SGD With Quantization, Sparsification, and Local Computations","publication_year":2020,"publication_date":"2020-04-07","ids":{"openalex":"https://openalex.org/W2948092338","doi":"https://doi.org/10.1109/jsait.2020.2985917","mag":"2948092338"},"language":"en","primary_location":{"id":"doi:10.1109/jsait.2020.2985917","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jsait.2020.2985917","pdf_url":null,"source":{"id":"https://openalex.org/S4210211895","display_name":"IEEE Journal on Selected Areas in Information Theory","issn_l":"2641-8770","issn":["2641-8770"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal on Selected Areas in Information Theory","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1906.02367","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067849515","display_name":"Debraj Basu","orcid":"https://orcid.org/0000-0003-3130-4253"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]},{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Debraj Basu","raw_affiliation_strings":["Adobe, Inc., San Jose, USA","Electrical and Computer Engineering, University of California at Los Angeles, Los Angeles, USA","[Adobe Systems]"],"affiliations":[{"raw_affiliation_string":"Adobe, Inc., San Jose, USA","institution_ids":["https://openalex.org/I1306409833"]},{"raw_affiliation_string":"Electrical and Computer Engineering, University of California at Los Angeles, Los Angeles, USA","institution_ids":["https://openalex.org/I161318765"]},{"raw_affiliation_string":"[Adobe Systems]","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023777978","display_name":"Deepesh Data","orcid":"https://orcid.org/0000-0003-3544-8414"},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Deepesh Data","raw_affiliation_strings":["Electrical and Computer Engineering, University of California at Los Angeles, Los Angeles, USA","University of California, Los Angeles, Los Angeles, United States"],"affiliations":[{"raw_affiliation_string":"Electrical and Computer Engineering, University of California at Los Angeles, Los Angeles, USA","institution_ids":["https://openalex.org/I161318765"]},{"raw_affiliation_string":"University of California, Los Angeles, Los Angeles, United States","institution_ids":["https://openalex.org/I161318765"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103177913","display_name":"Can Karakus","orcid":"https://orcid.org/0000-0001-6878-6984"},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]},{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]},{"id":"https://openalex.org/I4210089985","display_name":"Amazon (Germany)","ror":"https://ror.org/00b9ktm87","country_code":"DE","type":"company","lineage":["https://openalex.org/I1311688040","https://openalex.org/I4210089985"]}],"countries":["DE","US"],"is_corresponding":false,"raw_author_name":"Can Karakus","raw_affiliation_strings":["Amazon Web Services, Seattle, USA","Electrical and Computer Engineering, University of California at Los Angeles, Los Angeles, USA","Amazon"],"affiliations":[{"raw_affiliation_string":"Amazon Web Services, Seattle, USA","institution_ids":["https://openalex.org/I1311688040"]},{"raw_affiliation_string":"Electrical and Computer Engineering, University of California at Los Angeles, Los Angeles, USA","institution_ids":["https://openalex.org/I161318765"]},{"raw_affiliation_string":"Amazon","institution_ids":["https://openalex.org/I4210089985"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083980887","display_name":"Suhas Diggavi","orcid":"https://orcid.org/0000-0001-7313-9861"},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Suhas N. Diggavi","raw_affiliation_strings":["Electrical and Computer Engineering, University of California at Los Angeles, Los Angeles, USA","University of California-Los Angeles"],"affiliations":[{"raw_affiliation_string":"Electrical and Computer Engineering, University of California at Los Angeles, Los Angeles, USA","institution_ids":["https://openalex.org/I161318765"]},{"raw_affiliation_string":"University of California-Los Angeles","institution_ids":["https://openalex.org/I161318765"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5067849515"],"corresponding_institution_ids":["https://openalex.org/I1306409833","https://openalex.org/I161318765"],"apc_list":null,"apc_paid":null,"fwci":2.3356,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.87050283,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"1","issue":"1","first_page":"217","last_page":"226"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.6325991749763489},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6321519613265991},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6107487082481384},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.5979855060577393},{"id":"https://openalex.org/keywords/asynchronous-communication","display_name":"Asynchronous communication","score":0.5393736958503723},{"id":"https://openalex.org/keywords/rate-of-convergence","display_name":"Rate of convergence","score":0.48615762591362},{"id":"https://openalex.org/keywords/regular-polygon","display_name":"Regular polygon","score":0.4672883152961731},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4096089005470276},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3354809582233429},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.29534822702407837},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.1538802981376648},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.07334080338478088},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.07075530290603638}],"concepts":[{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6325991749763489},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6321519613265991},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6107487082481384},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.5979855060577393},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.5393736958503723},{"id":"https://openalex.org/C57869625","wikidata":"https://www.wikidata.org/wiki/Q1783502","display_name":"Rate of convergence","level":3,"score":0.48615762591362},{"id":"https://openalex.org/C112680207","wikidata":"https://www.wikidata.org/wiki/Q714886","display_name":"Regular polygon","level":2,"score":0.4672883152961731},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4096089005470276},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3354809582233429},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.29534822702407837},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.1538802981376648},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.07334080338478088},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.07075530290603638},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1109/jsait.2020.2985917","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jsait.2020.2985917","pdf_url":null,"source":{"id":"https://openalex.org/S4210211895","display_name":"IEEE Journal on Selected Areas in Information Theory","issn_l":"2641-8770","issn":["2641-8770"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal on Selected Areas in Information Theory","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1906.02367","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1906.02367","pdf_url":"https://arxiv.org/pdf/1906.02367","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2948092338","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/1906.02367","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1906.02367","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1906.02367","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"mag:2971064744","is_oa":false,"landing_page_url":"https://papers.nips.cc/paper/9610-qsparse-local-sgd-distributed-sgd-with-quantization-sparsification-and-local-computations.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306420609","display_name":"Neural Information Processing Systems","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":"Neural Information Processing Systems","raw_type":null}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1906.02367","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1906.02367","pdf_url":"https://arxiv.org/pdf/1906.02367","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1637379582","display_name":null,"funder_award_id":"W911NF-17-2-0196","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"},{"id":"https://openalex.org/G4498150772","display_name":null,"funder_award_id":"1514531","funder_id":"https://openalex.org/F4320335353","funder_display_name":"National Science Foundation of Sri Lanka"}],"funders":[{"id":"https://openalex.org/F4320335353","display_name":"National Science Foundation of Sri Lanka","ror":"https://ror.org/010xaa060"},{"id":"https://openalex.org/F4320338295","display_name":"Army Research Laboratory","ror":"https://ror.org/011hc8f90"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":77,"referenced_works":["https://openalex.org/W114517082","https://openalex.org/W1415242555","https://openalex.org/W1992208280","https://openalex.org/W1994616650","https://openalex.org/W2103325786","https://openalex.org/W2108475251","https://openalex.org/W2112269233","https://openalex.org/W2112796928","https://openalex.org/W2138243089","https://openalex.org/W2142623206","https://openalex.org/W2143908786","https://openalex.org/W2154682027","https://openalex.org/W2156779765","https://openalex.org/W2162576315","https://openalex.org/W2180530054","https://openalex.org/W2194775991","https://openalex.org/W2402144811","https://openalex.org/W2405578611","https://openalex.org/W2405883473","https://openalex.org/W2407022425","https://openalex.org/W2460815216","https://openalex.org/W2541884796","https://openalex.org/W2547352193","https://openalex.org/W2605994693","https://openalex.org/W2606891064","https://openalex.org/W2729686365","https://openalex.org/W2787998955","https://openalex.org/W2888561381","https://openalex.org/W2889676205","https://openalex.org/W2890924858","https://openalex.org/W2896457183","https://openalex.org/W2900182564","https://openalex.org/W2911327153","https://openalex.org/W2911863041","https://openalex.org/W2944542720","https://openalex.org/W2951781666","https://openalex.org/W2962952793","https://openalex.org/W2963179579","https://openalex.org/W2963335821","https://openalex.org/W2963540381","https://openalex.org/W2963664311","https://openalex.org/W2963766684","https://openalex.org/W2963803379","https://openalex.org/W2964004663","https://openalex.org/W2964121744","https://openalex.org/W2964163156","https://openalex.org/W2964267428","https://openalex.org/W3101036738","https://openalex.org/W6628022308","https://openalex.org/W6631190155","https://openalex.org/W6676540010","https://openalex.org/W6676963778","https://openalex.org/W6680402377","https://openalex.org/W6682774789","https://openalex.org/W6683245038","https://openalex.org/W6684583874","https://openalex.org/W6685655662","https://openalex.org/W6713134421","https://openalex.org/W6713835734","https://openalex.org/W6714239094","https://openalex.org/W6728757088","https://openalex.org/W6728975057","https://openalex.org/W6738460352","https://openalex.org/W6739513683","https://openalex.org/W6745723224","https://openalex.org/W6746200960","https://openalex.org/W6746839373","https://openalex.org/W6748019269","https://openalex.org/W6748304459","https://openalex.org/W6751646691","https://openalex.org/W6752012617","https://openalex.org/W6752191696","https://openalex.org/W6754341472","https://openalex.org/W6754416507","https://openalex.org/W6758358981","https://openalex.org/W6758557334","https://openalex.org/W6763549698"],"related_works":["https://openalex.org/W2971064744","https://openalex.org/W2950953465","https://openalex.org/W3097291876","https://openalex.org/W2769644379","https://openalex.org/W2998304172","https://openalex.org/W3124360785","https://openalex.org/W2800887228","https://openalex.org/W2964267428","https://openalex.org/W2743961547","https://openalex.org/W3011425085","https://openalex.org/W2913259183","https://openalex.org/W2126290786","https://openalex.org/W3101036738","https://openalex.org/W2942276578","https://openalex.org/W2908936460","https://openalex.org/W2954590635","https://openalex.org/W1596024815","https://openalex.org/W2573736728","https://openalex.org/W2429995037","https://openalex.org/W3036128815"],"abstract_inverted_index":{"Communication":[0],"bottleneck":[1],"has":[2],"been":[3,24],"identified":[4],"as":[5,106],"a":[6],"significant":[7,132],"issue":[8],"in":[9,86,131,137],"distributed":[10,88,108],"optimization":[11],"of":[12,29,63,79,114,140],"large-scale":[13],"learning":[14],"models.":[15],"Recently,":[16],"several":[17],"approaches":[18],"to":[19,121,143],"mitigate":[20],"this":[21,41],"problem":[22],"have":[23],"proposed,":[25],"including":[26],"different":[27],"forms":[28],"gradient":[30],"compression":[31],"or":[32],"computing":[33],"local":[34,54],"models":[35],"and":[36,53,69,76,93,116,126],"mixing":[37],"them":[38],"iteratively.":[39],"In":[40],"paper,":[42],"we":[43],"propose":[44,73],"Qsparse-local-SGD":[45,85,100,120],"algorithm,":[46],"which":[47],"combines":[48],"aggressive":[49],"sparsification":[50],"with":[51,57],"quantization":[52],"computation":[55],"along":[56],"error":[58],"compensation,":[59],"by":[60],"keeping":[61],"track":[62],"the":[64,67,87,103,135,138],"difference":[65],"between":[66],"true":[68],"compressed":[70],"gradients.":[71],"We":[72,81,97,118],"both":[74],"synchronous":[75],"asynchronous":[77],"implementations":[78],"Qsparse-local-SGD.":[80],"analyze":[82],"convergence":[83],"for":[84,90,110],"setting":[89],"smooth":[91],"non-convex":[92],"convex":[94],"objective":[95],"functions.":[96],"demonstrate":[98],"that":[99,128],"converges":[101],"at":[102],"same":[104],"rate":[105],"vanilla":[107],"SGD":[109],"many":[111],"important":[112],"classes":[113],"sparsifiers":[115],"quantizers.":[117],"use":[119],"train":[122],"ResNet-50":[123],"on":[124],"ImageNet":[125],"show":[127],"it":[129],"results":[130],"savings":[133],"over":[134],"state-of-the-art,":[136],"number":[139],"bits":[141],"transmitted":[142],"reach":[144],"target":[145],"accuracy.":[146]},"counts_by_year":[{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":2}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
