{"id":"https://openalex.org/W2966297898","doi":"https://doi.org/10.24963/ijcai.2019/637","title":"Faster Distributed Deep Net Training: Computation and Communication Decoupled Stochastic Gradient Descent","display_name":"Faster Distributed Deep Net Training: Computation and Communication Decoupled Stochastic Gradient Descent","publication_year":2019,"publication_date":"2019-07-28","ids":{"openalex":"https://openalex.org/W2966297898","doi":"https://doi.org/10.24963/ijcai.2019/637","mag":"2966297898"},"language":"en","primary_location":{"id":"doi:10.24963/ijcai.2019/637","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2019/637","pdf_url":"https://www.ijcai.org/proceedings/2019/0637.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.ijcai.org/proceedings/2019/0637.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009264739","display_name":"Shuheng Shen","orcid":"https://orcid.org/0000-0001-6134-6601"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shuheng Shen","raw_affiliation_strings":["Anhui Province Key Laboratory of Big Data Analysis and Application","School of Computer Science and Technology, University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"Anhui Province Key Laboratory of Big Data Analysis and Application","institution_ids":[]},{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009732907","display_name":"Linli Xu","orcid":"https://orcid.org/0000-0003-0227-3793"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Linli Xu","raw_affiliation_strings":["Anhui Province Key Laboratory of Big Data Analysis and Application","School of Computer Science and Technology, University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"Anhui Province Key Laboratory of Big Data Analysis and Application","institution_ids":[]},{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054743312","display_name":"Jingchang Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingchang Liu","raw_affiliation_strings":["Anhui Province Key Laboratory of Big Data Analysis and Application","School of Computer Science and Technology, University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"Anhui Province Key Laboratory of Big Data Analysis and Application","institution_ids":[]},{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072210488","display_name":"Xianfeng Liang","orcid":"https://orcid.org/0000-0003-4055-1985"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xianfeng Liang","raw_affiliation_strings":["Anhui Province Key Laboratory of Big Data Analysis and Application","School of Computer Science and Technology, University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"Anhui Province Key Laboratory of Big Data Analysis and Application","institution_ids":[]},{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007825653","display_name":"Yifei Cheng","orcid":"https://orcid.org/0000-0003-3859-2921"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yifei Cheng","raw_affiliation_strings":["Anhui Province Key Laboratory of Big Data Analysis and Application","School of Data Science, University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"Anhui Province Key Laboratory of Big Data Analysis and Application","institution_ids":[]},{"raw_affiliation_string":"School of Data Science, University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5009264739"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":1.5896,"has_fulltext":false,"cited_by_count":19,"citation_normalized_percentile":{"value":0.8783325,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"4582","last_page":"4589"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.9816503524780273},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.8419970273971558},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8176499605178833},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.6893691420555115},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5188106894493103},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.4753655791282654},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.38353216648101807},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3624972403049469},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.33766472339630127}],"concepts":[{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.9816503524780273},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.8419970273971558},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8176499605178833},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6893691420555115},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5188106894493103},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.4753655791282654},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.38353216648101807},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3624972403049469},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33766472339630127}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.24963/ijcai.2019/637","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2019/637","pdf_url":"https://www.ijcai.org/proceedings/2019/0637.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.24963/ijcai.2019/637","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2019/637","pdf_url":"https://www.ijcai.org/proceedings/2019/0637.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2376276132","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5375682351","display_name":null,"funder_award_id":"91746301","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6013138505","display_name":null,"funder_award_id":"21501100","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6058138561","display_name":null,"funder_award_id":", No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6606293491","display_name":null,"funder_award_id":"61673364","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8982980116","display_name":null,"funder_award_id":"WK2150110008","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320325599","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2966297898.pdf","grobid_xml":"https://content.openalex.org/works/W2966297898.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W778657980","https://openalex.org/W1686810756","https://openalex.org/W1964981582","https://openalex.org/W2049469158","https://openalex.org/W2127941149","https://openalex.org/W2130062883","https://openalex.org/W2186615578","https://openalex.org/W2194775991","https://openalex.org/W2336650964","https://openalex.org/W2617766261","https://openalex.org/W2622263826","https://openalex.org/W2769644379","https://openalex.org/W2774000609","https://openalex.org/W2886404071","https://openalex.org/W2899771611","https://openalex.org/W2953384591","https://openalex.org/W2962700998","https://openalex.org/W2963179579","https://openalex.org/W2963470657","https://openalex.org/W2963766684","https://openalex.org/W3101036738","https://openalex.org/W3102816259","https://openalex.org/W3118608800","https://openalex.org/W4301239768"],"related_works":["https://openalex.org/W2317245370","https://openalex.org/W4249323025","https://openalex.org/W198851386","https://openalex.org/W2030310580","https://openalex.org/W947442053","https://openalex.org/W1980160788","https://openalex.org/W2148915962","https://openalex.org/W2283866686","https://openalex.org/W2319266294","https://openalex.org/W2966297898"],"abstract_inverted_index":{"With":[0],"the":[1,4,9,25,49,85,100,105,133],"increase":[2],"in":[3,46,81],"amount":[5],"of":[6,11,104,136],"data":[7],"and":[8,20,68,79,116,141],"expansion":[10],"model":[12],"scale,":[13],"distributed":[14,30,123],"parallel":[15,82],"training":[16,131,139],"becomes":[17],"an":[18],"important":[19],"successful":[21],"technique":[22],"to":[23,55,76,83,99,152],"address":[24],"optimization":[26],"challenges.":[27],"Nevertheless,":[28],"although":[29],"stochastic":[31,71],"gradient":[32,72],"descent":[33,73],"(SGD)":[34],"algorithms":[35],"can":[36],"achieve":[37,56],"a":[38,57,66,93,112],"linear":[39,58,94],"iteration":[40,95],"speedup,":[41],"they":[42],"are":[43],"limited":[44],"significantly":[45],"practice":[47],"by":[48],"communication":[50,69,80,86,114],"cost,":[51],"making":[52],"it":[53,110],"difficult":[54],"time":[59,118],"speedup.":[60],"In":[61,108],"this":[62],"paper,":[63],"we":[64],"propose":[65],"computation":[67,78,102],"decoupled":[70],"(CoCoD-SGD)":[74],"algorithm":[75],"run":[77],"reduce":[84],"cost.":[87],"We":[88],"prove":[89],"that":[90],"CoCoD-SGD":[91,149],"has":[92,111],"speedup":[96,119],"with":[97,121,143],"respect":[98],"total":[101],"capability":[103],"hardware":[106],"resources.":[107],"addition,":[109],"lower":[113],"complexity":[115],"better":[117],"comparing":[120],"traditional":[122,157],"SGD":[124],"algorithms.":[125],"Experiments":[126],"on":[127],"deep":[128],"neural":[129],"network":[130],"demonstrate":[132],"significant":[134],"improvements":[135],"CoCoD-SGD:":[137],"when":[138],"ResNet18":[140],"VGG16":[142],"16":[144],"Geforce":[145],"GTX":[146],"1080Ti":[147],"GPUs,":[148],"is":[150],"up":[151],"2-3":[153],"x":[154],"faster":[155],"than":[156],"synchronous":[158],"SGD.":[159]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":3}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
