{"id":"https://openalex.org/W2804294608","doi":"https://doi.org/10.1109/ijcnn.2019.8852172","title":"Sparse Binary Compression: Towards Distributed Deep Learning with minimal Communication","display_name":"Sparse Binary Compression: Towards Distributed Deep Learning with minimal Communication","publication_year":2019,"publication_date":"2019-07-01","ids":{"openalex":"https://openalex.org/W2804294608","doi":"https://doi.org/10.1109/ijcnn.2019.8852172","mag":"2804294608"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn.2019.8852172","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2019.8852172","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1805.08768","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009304455","display_name":"Felix Sattler","orcid":"https://orcid.org/0000-0002-9425-2238"},"institutions":[{"id":"https://openalex.org/I2800274787","display_name":"Fraunhofer Institute for Telecommunications, Heinrich Hertz Institute","ror":"https://ror.org/02tbr6331","country_code":"DE","type":"facility","lineage":["https://openalex.org/I2800274787","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Felix Sattler","raw_affiliation_strings":["Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany","[Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany]"],"affiliations":[{"raw_affiliation_string":"Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany","institution_ids":["https://openalex.org/I2800274787"]},{"raw_affiliation_string":"[Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany]","institution_ids":["https://openalex.org/I2800274787"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013534474","display_name":"Simon Wiedemann","orcid":"https://orcid.org/0000-0001-5144-3758"},"institutions":[{"id":"https://openalex.org/I2800274787","display_name":"Fraunhofer Institute for Telecommunications, Heinrich Hertz Institute","ror":"https://ror.org/02tbr6331","country_code":"DE","type":"facility","lineage":["https://openalex.org/I2800274787","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Simon Wiedemann","raw_affiliation_strings":["Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany","[Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany]"],"affiliations":[{"raw_affiliation_string":"Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany","institution_ids":["https://openalex.org/I2800274787"]},{"raw_affiliation_string":"[Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany]","institution_ids":["https://openalex.org/I2800274787"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107838719","display_name":"Klaus\u2010Robert M\u00fcller","orcid":null},"institutions":[{"id":"https://openalex.org/I4577782","display_name":"Technische Universit\u00e4t Berlin","ror":"https://ror.org/03v4gjf40","country_code":"DE","type":"education","lineage":["https://openalex.org/I4577782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Klaus-Robert Muller","raw_affiliation_strings":["Machine Learning Group, TU Berlin, Berlin, Germany"],"affiliations":[{"raw_affiliation_string":"Machine Learning Group, TU Berlin, Berlin, Germany","institution_ids":["https://openalex.org/I4577782"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026451495","display_name":"Wojciech Samek","orcid":"https://orcid.org/0000-0002-6283-3265"},"institutions":[{"id":"https://openalex.org/I2800274787","display_name":"Fraunhofer Institute for Telecommunications, Heinrich Hertz Institute","ror":"https://ror.org/02tbr6331","country_code":"DE","type":"facility","lineage":["https://openalex.org/I2800274787","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Wojciech Samek","raw_affiliation_strings":["Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany","[Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany]"],"affiliations":[{"raw_affiliation_string":"Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany","institution_ids":["https://openalex.org/I2800274787"]},{"raw_affiliation_string":"[Dept. of Video Coding and Analytics, Fraunhofer HHI, Berlin, Germany]","institution_ids":["https://openalex.org/I2800274787"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5009304455"],"corresponding_institution_ids":["https://openalex.org/I2800274787"],"apc_list":null,"apc_paid":null,"fwci":1.124,"has_fulltext":true,"cited_by_count":15,"citation_normalized_percentile":{"value":0.81665982,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8055438995361328},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.5098604559898376},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5093251466751099},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.4797888398170471},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4697601795196533},{"id":"https://openalex.org/keywords/upstream","display_name":"Upstream (networking)","score":0.45358091592788696},{"id":"https://openalex.org/keywords/compression-ratio","display_name":"Compression ratio","score":0.4491550326347351},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.4448287785053253},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.43247509002685547},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4176286458969116},{"id":"https://openalex.org/keywords/terabyte","display_name":"Terabyte","score":0.41159260272979736},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3809768557548523},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3700886368751526},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.332084059715271},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.22739624977111816},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.09670361876487732},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08983847498893738}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8055438995361328},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.5098604559898376},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5093251466751099},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.4797888398170471},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4697601795196533},{"id":"https://openalex.org/C191172861","wikidata":"https://www.wikidata.org/wiki/Q7899321","display_name":"Upstream (networking)","level":2,"score":0.45358091592788696},{"id":"https://openalex.org/C25797200","wikidata":"https://www.wikidata.org/wiki/Q828137","display_name":"Compression ratio","level":3,"score":0.4491550326347351},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.4448287785053253},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.43247509002685547},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4176286458969116},{"id":"https://openalex.org/C199683683","wikidata":"https://www.wikidata.org/wiki/Q8799","display_name":"Terabyte","level":2,"score":0.41159260272979736},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3809768557548523},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3700886368751526},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.332084059715271},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.22739624977111816},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.09670361876487732},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08983847498893738},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C511840579","wikidata":"https://www.wikidata.org/wiki/Q12757","display_name":"Internal combustion engine","level":2,"score":0.0},{"id":"https://openalex.org/C171146098","wikidata":"https://www.wikidata.org/wiki/Q124192","display_name":"Automotive engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/ijcnn.2019.8852172","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2019.8852172","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1805.08768","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1805.08768","pdf_url":"https://arxiv.org/pdf/1805.08768","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2804294608","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/1805.08768","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1805.08768","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1805.08768","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1805.08768","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1805.08768","pdf_url":"https://arxiv.org/pdf/1805.08768","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321773","display_name":"Fraunhofer-Gesellschaft","ror":"https://ror.org/05hkkdn48"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2804294608.pdf","grobid_xml":"https://content.openalex.org/works/W2804294608.grobid-xml"},"referenced_works_count":51,"referenced_works":["https://openalex.org/W1442374986","https://openalex.org/W1522301498","https://openalex.org/W1591801644","https://openalex.org/W1632114991","https://openalex.org/W2053637704","https://openalex.org/W2095705004","https://openalex.org/W2108598243","https://openalex.org/W2112796928","https://openalex.org/W2115613939","https://openalex.org/W2194775991","https://openalex.org/W2198403777","https://openalex.org/W2283463896","https://openalex.org/W2405578611","https://openalex.org/W2407022425","https://openalex.org/W2535838896","https://openalex.org/W2541884796","https://openalex.org/W2579247884","https://openalex.org/W2606891064","https://openalex.org/W2921802966","https://openalex.org/W2949117887","https://openalex.org/W2963446712","https://openalex.org/W2963803379","https://openalex.org/W4255949318","https://openalex.org/W6628377381","https://openalex.org/W6631190155","https://openalex.org/W6635446068","https://openalex.org/W6636649193","https://openalex.org/W6638667902","https://openalex.org/W6674330103","https://openalex.org/W6679154944","https://openalex.org/W6680402377","https://openalex.org/W6684249991","https://openalex.org/W6684859321","https://openalex.org/W6687494587","https://openalex.org/W6713835734","https://openalex.org/W6714239094","https://openalex.org/W6728757088","https://openalex.org/W6729239390","https://openalex.org/W6738460352","https://openalex.org/W6743846187","https://openalex.org/W6746200960","https://openalex.org/W6746839373","https://openalex.org/W6748019269","https://openalex.org/W6748579526","https://openalex.org/W6751521026","https://openalex.org/W6754341472","https://openalex.org/W6754416507","https://openalex.org/W6755593096","https://openalex.org/W6758358981","https://openalex.org/W6760157594","https://openalex.org/W6898611122"],"related_works":["https://openalex.org/W2978015420","https://openalex.org/W2407022425","https://openalex.org/W3124591689","https://openalex.org/W2994817185","https://openalex.org/W3208617247","https://openalex.org/W3111857673","https://openalex.org/W2338908902","https://openalex.org/W2969797940","https://openalex.org/W3174911677","https://openalex.org/W2918006316","https://openalex.org/W3126221229","https://openalex.org/W3104920644","https://openalex.org/W3189274515","https://openalex.org/W2752698706","https://openalex.org/W3164411344","https://openalex.org/W2921965200","https://openalex.org/W2515193474","https://openalex.org/W3211659500","https://openalex.org/W3136839710","https://openalex.org/W3188694252"],"abstract_inverted_index":{"Currently,":[0],"progressively":[1],"larger":[2],"deep":[3],"neural":[4,136],"networks":[5],"are":[6,18],"trained":[7],"on":[8,129,163],"ever":[9],"growing":[10],"data":[11],"corpora.":[12],"In":[13,191],"result,":[14],"distributed":[15,26,65],"training":[16,27],"schemes":[17],"becoming":[19],"increasingly":[20],"relevant.":[21],"A":[22],"major":[23],"issue":[24],"in":[25,40,152,165],"is":[28,200],"the":[29,113,116,126,149,166,172,192,195],"limited":[30],"communication":[31,38,62,72,128,198],"bandwidth":[32],"between":[33],"contributing":[34],"nodes":[35],"or":[36,179],"prohibitive":[37],"cost":[39,63],"general.":[41],"To":[42],"mitigate":[43],"this":[44],"problem":[45],"we":[46,159],"propose":[47],"Sparse":[48],"Binary":[49],"Compression":[50],"(SBC),":[51],"a":[52,58,78,130,183],"compression":[53,89],"framework":[54],"that":[55,122],"allows":[56,100],"for":[57,64,208],"drastic":[59],"reduction":[60],"of":[61,71,115,132,144,154,169],"training.":[66],"SBC":[67,123],"combines":[68],"existing":[69],"techniques":[70],"delay":[73],"and":[74,82,107,134],"gradient":[75,105],"sparsification":[76],"with":[77],"novel":[79],"binarization":[80],"method":[81,98],"optimal":[83],"weight":[84],"update":[85],"encoding":[86],"to":[87,91,102,110,112,171,182,205],"push":[88],"gains":[90],"new":[92],"limits.":[93],"By":[94],"doing":[95],"so,":[96],"our":[97],"also":[99],"us":[101],"smoothly":[103],"trade-off":[104],"sparsity":[106,109],"temporal":[108],"adapt":[111],"requirements":[114],"learning":[117],"task.":[118],"Our":[119],"experiments":[120],"show,":[121],"can":[124,160],"reduce":[125],"upstream":[127,197],"variety":[131],"convolutional":[133],"recurrent":[135],"network":[137],"architectures":[138],"by":[139],"more":[140],"than":[141],"four":[142],"orders":[143],"magnitude":[145],"without":[146],"significantly":[147],"harming":[148],"convergence":[150],"speed":[151],"terms":[153],"forward-backward":[155],"passes.":[156],"For":[157],"instance,":[158],"train":[161,180],"ResNet50":[162],"ImageNet":[164],"same":[167],"number":[168],"iterations":[170],"baseline":[173],"accuracy,":[174],"using":[175,187],"\u00d73531":[176],"less":[177,189],"bits":[178],"it":[181],"1%":[184],"lower":[185],"accuracy":[186],"\u00d737208":[188],"bits.":[190],"latter":[193],"case,":[194],"total":[196],"required":[199],"cut":[201],"from":[202],"125":[203],"terabytes":[204],"3.35":[206],"gigabytes":[207],"every":[209],"participating":[210],"client.":[211]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
