{"id":"https://openalex.org/W2743167307","doi":"https://doi.org/10.1145/3097983.3098080","title":"Communication-Efficient Distributed Block Minimization for Nonlinear Kernel Machines","display_name":"Communication-Efficient Distributed Block Minimization for Nonlinear Kernel Machines","publication_year":2017,"publication_date":"2017-08-04","ids":{"openalex":"https://openalex.org/W2743167307","doi":"https://doi.org/10.1145/3097983.3098080","mag":"2743167307"},"language":"en","primary_location":{"id":"doi:10.1145/3097983.3098080","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3097983.3098080","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010841999","display_name":"Cho\u2010Jui Hsieh","orcid":"https://orcid.org/0000-0002-3520-9627"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Cho-Jui Hsieh","raw_affiliation_strings":["University of California, Davis, Davis, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California, Davis, Davis, CA, USA","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001215167","display_name":"Si Si","orcid":"https://orcid.org/0000-0002-2406-7221"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Si Si","raw_affiliation_strings":["Google Inc. &amp; Google Research, Mountain View, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Inc. &amp; Google Research, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063459703","display_name":"Inderjit S. Dhillon","orcid":"https://orcid.org/0000-0002-2759-1416"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Inderjit S. Dhillon","raw_affiliation_strings":["University of Texas at Austin, Austin, TX, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Texas at Austin, Austin, TX, USA","institution_ids":["https://openalex.org/I86519309"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.6196,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.77199379,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"245","last_page":"254"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6604985594749451},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.639952540397644},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.6342378258705139},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5782535076141357},{"id":"https://openalex.org/keywords/hessian-matrix","display_name":"Hessian matrix","score":0.5235055088996887},{"id":"https://openalex.org/keywords/kernel-method","display_name":"Kernel method","score":0.5139421820640564},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5093556642532349},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.49942922592163086},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.49106597900390625},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.45895251631736755},{"id":"https://openalex.org/keywords/radial-basis-function-kernel","display_name":"Radial basis function kernel","score":0.45506665110588074},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.26120707392692566},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22006061673164368},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.09773749113082886}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6604985594749451},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.639952540397644},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.6342378258705139},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5782535076141357},{"id":"https://openalex.org/C203616005","wikidata":"https://www.wikidata.org/wiki/Q620495","display_name":"Hessian matrix","level":2,"score":0.5235055088996887},{"id":"https://openalex.org/C122280245","wikidata":"https://www.wikidata.org/wiki/Q620622","display_name":"Kernel method","level":3,"score":0.5139421820640564},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5093556642532349},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.49942922592163086},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.49106597900390625},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.45895251631736755},{"id":"https://openalex.org/C75866337","wikidata":"https://www.wikidata.org/wiki/Q7280263","display_name":"Radial basis function kernel","level":4,"score":0.45506665110588074},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.26120707392692566},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22006061673164368},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.09773749113082886},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3097983.3098080","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3097983.3098080","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1463675261","display_name":null,"funder_award_id":"CCF-1320746","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5682525824","display_name":null,"funder_award_id":"IIS-1546452","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G679029799","display_name":null,"funder_award_id":"CCF-1564000","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1486305586","https://openalex.org/W1506135481","https://openalex.org/W1512098439","https://openalex.org/W1522126829","https://openalex.org/W1576520375","https://openalex.org/W1697545848","https://openalex.org/W1842246424","https://openalex.org/W1842705303","https://openalex.org/W1946315329","https://openalex.org/W1990470142","https://openalex.org/W2032395696","https://openalex.org/W2070272652","https://openalex.org/W2099262739","https://openalex.org/W2108712612","https://openalex.org/W2112545207","https://openalex.org/W2115975329","https://openalex.org/W2117669906","https://openalex.org/W2117990954","https://openalex.org/W2118563516","https://openalex.org/W2123154536","https://openalex.org/W2135910425","https://openalex.org/W2138064276","https://openalex.org/W2139224857","https://openalex.org/W2144902422","https://openalex.org/W2170796499","https://openalex.org/W2171602483","https://openalex.org/W2278578264","https://openalex.org/W2293711698","https://openalex.org/W2350220533","https://openalex.org/W2553080076","https://openalex.org/W2578798508","https://openalex.org/W2584746436","https://openalex.org/W2606823780","https://openalex.org/W2912728463","https://openalex.org/W2963861706","https://openalex.org/W3007502339"],"related_works":["https://openalex.org/W1603091392","https://openalex.org/W3123056048","https://openalex.org/W4389428786","https://openalex.org/W2079825755","https://openalex.org/W4389251307","https://openalex.org/W4386075310","https://openalex.org/W2089892314","https://openalex.org/W2974741803","https://openalex.org/W1983263273","https://openalex.org/W3024148442"],"abstract_inverted_index":{"Nonlinear":[0],"kernel":[1,32,54,111,148,194,216,243],"machines":[2,33,252],"often":[3],"yield":[4],"superior":[5],"predictive":[6],"performance":[7],"on":[8,151,166],"various":[9],"tasks;":[10],"however,":[11],"they":[12],"suffer":[13],"from":[14],"severe":[15],"computational":[16],"challenges.":[17],"In":[18,37],"this":[19,265],"paper,":[20],"we":[21,39],"show":[22,155],"how":[23],"to":[24,96,145,202,222,264],"overcome":[25],"the":[26,64,75,101,107,120,167,191,213,227,242],"important":[27],"challenge":[28],"of":[29,74,100,110,119,127],"speeding":[30],"up":[31],"using":[34,186,250],"multiple":[35],"computers.":[36],"particular,":[38],"develop":[40],"a":[41,71,88,124,156,204],"parallel":[42,161,193,238],"block":[43],"minimization":[44],"framework,":[45],"and":[46,56,130,136,154,233],"demonstrate":[47],"its":[48],"good":[49],"scalability":[50],"in":[51,84,183,256],"solving":[52],"nonlinear":[53],"SVM":[55,149,195,217,244],"logistic":[57],"regression.":[58],"Our":[59],"framework":[60],"proceeds":[61],"by":[62,69,105],"dividing":[63],"problem":[65,108],"into":[66],"smaller":[67],"subproblems":[68,79],"forming":[70],"block-diagonal":[72],"approximation":[73],"Hessian":[76],"matrix.":[77],"The":[78],"are":[80],"then":[81],"solved":[82],"approximately":[83],"parallel.":[85],"After":[86],"that,":[87],"communication":[89],"efficient":[90],"line":[91],"search":[92],"procedure":[93],"is":[94,212],"developed":[95],"ensure":[97],"sufficient":[98],"reduction":[99],"objective":[102],"function":[103],"value":[104],"exploiting":[106],"structure":[109],"machines.":[112],"We":[113,141],"prove":[114],"global":[115],"linear":[116],"convergence":[117],"rate":[118],"proposed":[121],"method":[122],"with":[123,170,180,206,253],"wide":[125],"class":[126],"subproblem":[128],"solvers,":[129],"our":[131,143,173,210,237],"analysis":[132],"covers":[133],"strongly":[134],"convex":[135,139],"some":[137],"non-strongly":[138],"functions.":[140],"apply":[142],"algorithm":[144,174,211],"solve":[146],"large-scale":[147],"problems":[150],"distributed":[152,215],"systems,":[153],"significant":[157],"improvement":[158],"over":[159],"existing":[160,259],"solvers.":[162],"As":[163],"an":[164,177,248],"example,":[165],"covtype":[168],"dataset":[169,229],"half-a-million":[171],"samples,":[172],"can":[175,220,240,261],"obtain":[176],"approximate":[178],"solution":[179,205,245],"96%":[181],"accuracy":[182],"20":[184],"seconds":[185,201],"32":[187,251],"machines,":[188],"while":[189,258],"all":[190],"other":[192],"solvers":[196,260],"require":[197],"more":[198],"than":[199],"2000":[200],"achieve":[203],"95%":[207],"accuracy.":[208],"Moreover,":[209],"first":[214],"solver":[218,239],"that":[219],"scale":[221,263],"massive":[223],"data":[224],"sets.":[225],"On":[226],"KDDB":[228],"(20":[230],"million":[231,235],"samples":[232],"30":[234],"features),":[236],"compute":[241],"within":[246],"half":[247],"hour":[249],"640":[254],"cores":[255],"total,":[257],"not":[262],"dataset.":[266]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
