{"id":"https://openalex.org/W2221538265","doi":"https://doi.org/10.1109/bigdata.2015.7364091","title":"Large-scale learning with AdaGrad on Spark","display_name":"Large-scale learning with AdaGrad on Spark","publication_year":2015,"publication_date":"2015-10-01","ids":{"openalex":"https://openalex.org/W2221538265","doi":"https://doi.org/10.1109/bigdata.2015.7364091","mag":"2221538265"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2015.7364091","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2015.7364091","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026382684","display_name":"Asmelash Teka Hadgu","orcid":"https://orcid.org/0000-0002-4012-3772"},"institutions":[{"id":"https://openalex.org/I4210136150","display_name":"L3S Research Center","ror":"https://ror.org/039t4wk02","country_code":"DE","type":"facility","lineage":["https://openalex.org/I114112103","https://openalex.org/I4210136150","https://openalex.org/I94509681"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Asmelash Teka Hadgu","raw_affiliation_strings":["L3S Research Center, Hannover, Germany"],"affiliations":[{"raw_affiliation_string":"L3S Research Center, Hannover, Germany","institution_ids":["https://openalex.org/I4210136150"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077135517","display_name":"Aastha Nigam","orcid":null},"institutions":[{"id":"https://openalex.org/I107639228","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43","country_code":"US","type":"education","lineage":["https://openalex.org/I107639228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aastha Nigam","raw_affiliation_strings":["University of Notre Dame, Indiana, USA"],"affiliations":[{"raw_affiliation_string":"University of Notre Dame, Indiana, USA","institution_ids":["https://openalex.org/I107639228"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002826517","display_name":"Ernesto Diaz-Aviles","orcid":null},"institutions":[{"id":"https://openalex.org/I4210145784","display_name":"IBM Research - Ireland","ror":"https://ror.org/04jnxr720","country_code":"IE","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210145784"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Ernesto Diaz-Aviles","raw_affiliation_strings":["IBM Research, Dublin, Ireland"],"affiliations":[{"raw_affiliation_string":"IBM Research, Dublin, Ireland","institution_ids":["https://openalex.org/I4210145784"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5026382684"],"corresponding_institution_ids":["https://openalex.org/I4210136150"],"apc_list":null,"apc_paid":null,"fwci":5.1773,"has_fulltext":false,"cited_by_count":50,"citation_normalized_percentile":{"value":0.95696334,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2828","last_page":"2830"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8052971363067627},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.709846019744873},{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.6853640675544739},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.661773681640625},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6345090270042419},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6104686260223389},{"id":"https://openalex.org/keywords/online-machine-learning","display_name":"Online machine learning","score":0.6000601649284363},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.509966254234314},{"id":"https://openalex.org/keywords/active-learning","display_name":"Active learning (machine learning)","score":0.31185609102249146},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.20573529601097107},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.13838934898376465},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.1320987343788147}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8052971363067627},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.709846019744873},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.6853640675544739},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.661773681640625},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6345090270042419},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6104686260223389},{"id":"https://openalex.org/C115903097","wikidata":"https://www.wikidata.org/wiki/Q7094097","display_name":"Online machine learning","level":3,"score":0.6000601649284363},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.509966254234314},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.31185609102249146},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.20573529601097107},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.13838934898376465},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.1320987343788147},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata.2015.7364091","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2015.7364091","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W410850256","https://openalex.org/W1556219185","https://openalex.org/W1994616650","https://openalex.org/W2001575213","https://openalex.org/W2146502635","https://openalex.org/W2963288913","https://openalex.org/W6614148910","https://openalex.org/W6681435938"],"related_works":["https://openalex.org/W2974335793","https://openalex.org/W2790778417","https://openalex.org/W3196155444","https://openalex.org/W3025582806","https://openalex.org/W2792987183","https://openalex.org/W2954428433","https://openalex.org/W3210156800","https://openalex.org/W2295628041","https://openalex.org/W2239420864","https://openalex.org/W2969890106"],"abstract_inverted_index":{"Stochastic":[0],"Gradient":[1],"Descent":[2],"(SGD)":[3],"is":[4,37,40,94],"a":[5,67,79,95,130,194],"simple":[6],"yet":[7],"very":[8],"efficient":[9],"online":[10],"learning":[11,31,44,69,87,145,159],"algorithm":[12],"for":[13,71,84,141],"optimizing":[14],"convex":[15],"(and":[16],"often":[17],"non-convex)":[18],"functions":[19],"and":[20,104,133,164,199],"one":[21],"of":[22,35,55,58,82,162,169],"the":[23,43,56,59,157,172],"most":[24],"popular":[25],"stochastic":[26],"optimization":[27],"methods":[28],"in":[29,62,111,156,177],"machine":[30,86,144,158],"today.":[32],"One":[33],"drawback":[34],"SGD":[36,173],"that":[38,100,186],"it":[39,135,139],"sensitive":[41],"to":[42,65,108,113,126],"rate":[45,70],"hyper-parameter.":[46],"The":[47],"Adaptive":[48],"Sub-gradient":[49],"Descent,":[50],"AdaGrad,":[51],"dynamically":[52],"incorporates":[53],"knowledge":[54],"geometry":[57],"data":[60,128],"observed":[61],"earlier":[63],"iterations":[64],"calculate":[66],"different":[68],"every":[72],"feature.":[73],"In":[74],"this":[75],"work,":[76],"we":[77,183],"implement":[78],"distributed":[80],"version":[81],"AdaGrad":[83,170,187],"large-scale":[85,153],"tasks":[88,161],"using":[89],"Apache":[90,92],"Spark.":[91],"Spark":[93],"fast":[96,198],"cluster":[97],"computing":[98],"engine":[99],"provides":[101],"similar":[102],"scalability":[103],"fault":[105],"tolerance":[106],"properties":[107],"MapReduce,":[109],"but":[110],"contrast":[112],"Hadoop's":[114],"two-stage":[115],"disk-based":[116],"MapReduce":[117],"paradigm,":[118],"Spark's":[119,178],"multi-stage":[120],"in-memory":[121],"primitives":[122],"allow":[123],"user":[124],"programs":[125],"load":[127],"into":[129],"cluster's":[131],"memory":[132],"query":[134],"repeatedly,":[136],"which":[137],"makes":[138],"ideal":[140],"building":[142],"scalable":[143],"applications.":[146],"We":[147],"empirically":[148],"evaluate":[149],"our":[150,167],"implementation":[151,168],"on":[152],"real-world":[154],"problems":[155],"canonical":[160],"classification":[163],"regression.":[165],"Comparing":[166],"with":[171],"scheduler":[174],"currently":[175],"available":[176],"Machine":[179],"Learning":[180],"Library":[181],"(MLlib),":[182],"experimentally":[184],"show":[185],"saves":[188],"time":[189],"by":[190],"avoiding":[191],"manually":[192],"setting":[193],"learning-rate":[195],"hyperparameter,":[196],"converges":[197],"can":[200],"even":[201],"achieve":[202],"better":[203],"generalization":[204],"errors.":[205]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":9},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
