{"id":"https://openalex.org/W3046818610","doi":"https://doi.org/10.1145/3377929.3389915","title":"Population-based evolutionary distributed SGD","display_name":"Population-based evolutionary distributed SGD","publication_year":2020,"publication_date":"2020-07-08","ids":{"openalex":"https://openalex.org/W3046818610","doi":"https://doi.org/10.1145/3377929.3389915","mag":"3046818610"},"language":"en","primary_location":{"id":"doi:10.1145/3377929.3389915","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3377929.3389915","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2020 Genetic and Evolutionary Computation Conference Companion","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.research.ed.ac.uk/en/publications/f9fc0b23-ce48-4f91-83eb-cf2b1d621714","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055844003","display_name":"Amna Shahab","orcid":"https://orcid.org/0000-0001-9896-1763"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Amna Shahab","raw_affiliation_strings":["University of Edinburgh"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010276850","display_name":"Boris Grot","orcid":"https://orcid.org/0000-0001-6525-0762"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Boris Grot","raw_affiliation_strings":["University of Edinburgh"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh","institution_ids":["https://openalex.org/I98677209"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5055844003"],"corresponding_institution_ids":["https://openalex.org/I98677209"],"apc_list":null,"apc_paid":null,"fwci":0.3977,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.68450813,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"153","last_page":"154"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.801110029220581},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.78513503074646},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.6925910115242004},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.5266387462615967},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.48708319664001465},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4744991958141327},{"id":"https://openalex.org/keywords/evolutionary-algorithm","display_name":"Evolutionary algorithm","score":0.4734758138656616},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.4432421922683716},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4320615231990814},{"id":"https://openalex.org/keywords/limit","display_name":"Limit (mathematics)","score":0.43071433901786804},{"id":"https://openalex.org/keywords/complementarity","display_name":"Complementarity (molecular biology)","score":0.428339421749115},{"id":"https://openalex.org/keywords/data-parallelism","display_name":"Data parallelism","score":0.4144981801509857},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.320161908864975},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3091876804828644},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0836181640625}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.801110029220581},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.78513503074646},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.6925910115242004},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.5266387462615967},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.48708319664001465},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4744991958141327},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.4734758138656616},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.4432421922683716},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4320615231990814},{"id":"https://openalex.org/C151201525","wikidata":"https://www.wikidata.org/wiki/Q177239","display_name":"Limit (mathematics)","level":2,"score":0.43071433901786804},{"id":"https://openalex.org/C202269582","wikidata":"https://www.wikidata.org/wiki/Q2644277","display_name":"Complementarity (molecular biology)","level":2,"score":0.428339421749115},{"id":"https://openalex.org/C61483411","wikidata":"https://www.wikidata.org/wiki/Q3124522","display_name":"Data parallelism","level":3,"score":0.4144981801509857},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.320161908864975},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3091876804828644},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0836181640625},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3377929.3389915","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3377929.3389915","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2020 Genetic and Evolutionary Computation Conference Companion","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.ed.ac.uk:openaire/f9fc0b23-ce48-4f91-83eb-cf2b1d621714","is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/f9fc0b23-ce48-4f91-83eb-cf2b1d621714","pdf_url":null,"source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Shahab, A & Grot, B 2020, Population-based Evolutionary Distributed SGD. in Proceedings of the 2020 Genetic and Evolutionary Computation Conference Companion : GECCO '20. Association for Computing Machinery (ACM), pp. 153\u2013154, The Genetic and Evolutionary Computation Conference 2020, Cancun, Mexico, 8/07/20. https://doi.org/10.1145/3377929.3389915","raw_type":"contributionToPeriodical"},{"id":"pmh:oai:pure.ed.ac.uk:publications/f9fc0b23-ce48-4f91-83eb-cf2b1d621714","is_oa":false,"landing_page_url":"https://www.research.ed.ac.uk/portal/en/publications/populationbased-evolutionary-distributed-sgd(f9fc0b23-ce48-4f91-83eb-cf2b1d621714).html","pdf_url":null,"source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""}],"best_oa_location":{"id":"pmh:oai:pure.ed.ac.uk:openaire/f9fc0b23-ce48-4f91-83eb-cf2b1d621714","is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/f9fc0b23-ce48-4f91-83eb-cf2b1d621714","pdf_url":null,"source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Shahab, A & Grot, B 2020, Population-based Evolutionary Distributed SGD. in Proceedings of the 2020 Genetic and Evolutionary Computation Conference Companion : GECCO '20. Association for Computing Machinery (ACM), pp. 153\u2013154, The Genetic and Evolutionary Computation Conference 2020, Cancun, Mexico, 8/07/20. https://doi.org/10.1145/3377929.3389915","raw_type":"contributionToPeriodical"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5811753289","display_name":null,"funder_award_id":"EP/M507258/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W2344075909","https://openalex.org/W2479609865","https://openalex.org/W2593744649","https://openalex.org/W2884711234","https://openalex.org/W2890850833","https://openalex.org/W2909837330","https://openalex.org/W2963959597","https://openalex.org/W2964352239","https://openalex.org/W2970139027","https://openalex.org/W2994848047"],"related_works":["https://openalex.org/W2950520577","https://openalex.org/W1554644772","https://openalex.org/W2003935582","https://openalex.org/W2494130044","https://openalex.org/W3170887803","https://openalex.org/W74409296","https://openalex.org/W3209384898","https://openalex.org/W4400951174","https://openalex.org/W1595834484","https://openalex.org/W1991844655"],"abstract_inverted_index":{"Neural":[0],"model":[1,121],"training":[2,24,70,74,83,86,122],"is":[3,10,26],"a":[4,27,44,64,89,101],"time-consuming":[5],"task":[6],"where":[7],"exploiting":[8],"parallelism":[9],"of":[11,42,53,104,115],"utmost":[12],"importance.":[13],"Employing":[14],"data-parallelism":[15],"in":[16,127],"stochastic":[17],"gradient":[18],"descent":[19],"(SGD)":[20],"by":[21],"partitioning":[22],"the":[23,40,47,51,95,107,113],"dataset":[25],"popular":[28],"approach;":[29],"however,":[30],"algorithmic":[31],"inefficiencies":[32],"when":[33],"operating":[34],"at":[35],"large":[36],"minibatch":[37],"sizes":[38],"limit":[39],"degree":[41],"parallelism,":[43],"problem":[45],"termed":[46],"scalability":[48,55],"limit.":[49],"In":[50],"face":[52],"this":[54],"challenge,":[56],"we":[57],"propose":[58],"using":[59],"Evolutionary":[60],"Algorithms":[61],"(EA)":[62],"as":[63],"meta-algorithm":[65],"together":[66],"with":[67,88],"SGD":[68,82,116],"for":[69,106,119],"neural":[71,120],"models.":[72],"Our":[73],"scheme,":[75],"<u>P</u>opulation-based":[76],"<u>E</u>volutionary":[77],"<u>SGD</u>":[78],"(PESGD)":[79],"combines":[80],"local":[81],"on":[84],"each":[85],"node":[87],"periodic":[90],"evolutionary":[91],"step":[92],"which":[93],"selects":[94],"best":[96],"performing":[97],"models":[98,105],"to":[99],"generate":[100],"new":[102],"population":[103],"next":[108],"iteration.":[109],"We":[110],"believe":[111],"that":[112],"complementarity":[114],"and":[117],"EA":[118],"can":[123],"be":[124],"exploited":[125],"well":[126],"PESGD.":[128]},"counts_by_year":[{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
