{"id":"https://openalex.org/W3022815319","doi":"https://doi.org/10.1145/3425500","title":"Accelerating Deep Neuroevolution on Distributed FPGAs for Reinforcement Learning Problems","display_name":"Accelerating Deep Neuroevolution on Distributed FPGAs for Reinforcement Learning Problems","publication_year":2021,"publication_date":"2021-04-05","ids":{"openalex":"https://openalex.org/W3022815319","doi":"https://doi.org/10.1145/3425500","mag":"3022815319"},"language":"en","primary_location":{"id":"doi:10.1145/3425500","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3425500","pdf_url":null,"source":{"id":"https://openalex.org/S96198239","display_name":"ACM Journal on Emerging Technologies in Computing Systems","issn_l":"1550-4832","issn":["1550-4832","1550-4840"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Journal on Emerging Technologies in Computing Systems","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2005.04536","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Alexis Asseman","orcid":null},"institutions":[{"id":"https://openalex.org/I4210085935","display_name":"IBM Research - Almaden","ror":"https://ror.org/005w8dd04","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210085935","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alexis Asseman","raw_affiliation_strings":["IBM Almaden Research Center, California, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Almaden Research Center, California, USA","institution_ids":["https://openalex.org/I4210085935"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Nicolas Antoine","orcid":null},"institutions":[{"id":"https://openalex.org/I4210085935","display_name":"IBM Research - Almaden","ror":"https://ror.org/005w8dd04","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210085935","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nicolas Antoine","raw_affiliation_strings":["IBM Almaden Research Center, California, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Almaden Research Center, California, USA","institution_ids":["https://openalex.org/I4210085935"]}]},{"author_position":"last","author":{"id":null,"display_name":"Ahmet S. Ozcan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210085935","display_name":"IBM Research - Almaden","ror":"https://ror.org/005w8dd04","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210085935","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ahmet S. Ozcan","raw_affiliation_strings":["IBM Almaden Research Center, California, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Almaden Research Center, California, USA","institution_ids":["https://openalex.org/I4210085935"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.5597,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.7165719,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"17","issue":"2","first_page":"1","last_page":"17"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.6401000022888184,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.6401000022888184,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.10209999978542328,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.04729999974370003,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/neuroevolution","display_name":"Neuroevolution","score":0.9470000267028809},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6922000050544739},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6527000069618225},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5760999917984009},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.5407000184059143},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.5350000262260437},{"id":"https://openalex.org/keywords/ibm","display_name":"IBM","score":0.5224000215530396},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.43630000948905945}],"concepts":[{"id":"https://openalex.org/C118070581","wikidata":"https://www.wikidata.org/wiki/Q2060528","display_name":"Neuroevolution","level":3,"score":0.9470000267028809},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7833999991416931},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6922000050544739},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6527000069618225},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5778999924659729},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5760999917984009},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.5407000184059143},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.5350000262260437},{"id":"https://openalex.org/C70388272","wikidata":"https://www.wikidata.org/wiki/Q5968558","display_name":"IBM","level":2,"score":0.5224000215530396},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.43630000948905945},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.4099000096321106},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3896999955177307},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.38830000162124634},{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.37720000743865967},{"id":"https://openalex.org/C8880873","wikidata":"https://www.wikidata.org/wiki/Q187787","display_name":"Genetic algorithm","level":2,"score":0.3181999921798706},{"id":"https://openalex.org/C3018412434","wikidata":"https://www.wikidata.org/wiki/Q7889","display_name":"Video game","level":2,"score":0.3043999969959259},{"id":"https://openalex.org/C86111242","wikidata":"https://www.wikidata.org/wiki/Q859595","display_name":"Coprocessor","level":2,"score":0.27459999918937683},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.2727999985218048},{"id":"https://openalex.org/C106515295","wikidata":"https://www.wikidata.org/wiki/Q26806595","display_name":"Parallel processing","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.26350000500679016},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.25859999656677246},{"id":"https://openalex.org/C121835503","wikidata":"https://www.wikidata.org/wiki/Q2596288","display_name":"Evolutionary programming","level":3,"score":0.2554999887943268},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.2554999887943268}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3425500","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3425500","pdf_url":null,"source":{"id":"https://openalex.org/S96198239","display_name":"ACM Journal on Emerging Technologies in Computing Systems","issn_l":"1550-4832","issn":["1550-4832","1550-4840"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Journal on Emerging Technologies in Computing Systems","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2005.04536","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2005.04536","pdf_url":"https://arxiv.org/pdf/2005.04536","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2005.04536","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2005.04536","pdf_url":"https://arxiv.org/pdf/2005.04536","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1925894136","https://openalex.org/W2325896489","https://openalex.org/W2565125333","https://openalex.org/W2580909119","https://openalex.org/W2588283865","https://openalex.org/W2625954420","https://openalex.org/W2796625795","https://openalex.org/W2810478946","https://openalex.org/W2899915146","https://openalex.org/W2931767035","https://openalex.org/W2962991582","https://openalex.org/W3011985620","https://openalex.org/W3130537609"],"related_works":[],"abstract_inverted_index":{"Reinforcement":[0],"learning,":[1],"augmented":[2],"by":[3],"the":[4,26,89,95,104,109,114,119,158,162],"representational":[5],"power":[6],"of":[7,29,88,131,161],"deep":[8,47,79],"neural":[9,96],"networks,":[10],"has":[11],"shown":[12],"promising":[13],"results":[14,51,112],"on":[15,56,82,118],"high-dimensional":[16],"problems,":[17],"such":[18,42],"as":[19,43],"game":[20,90],"playing":[21],"and":[22,46,94],"robotic":[23],"control.":[24],"However,":[25],"sequential":[27],"nature":[28],"these":[30],"problems":[31],"poses":[32],"a":[33,125,137],"fundamental":[34],"challenge":[35],"for":[36,74,153],"computational":[37],"efficiency.":[38],"Recently,":[39],"alternative":[40],"approaches":[41],"evolutionary":[44],"strategies":[45],"neuroevolution":[48,80],"demonstrated":[49],"competitive":[50],"with":[52,103],"faster":[53],"training":[54,64],"time":[55],"distributed":[57,83],"CPU":[58,159],"cores.":[59],"Here":[60],"we":[61],"report":[62],"record":[63],"times":[65],"(running":[66],"at":[67],"about":[68],"1":[69],"million":[70],"frames":[71],"per":[72],"second)":[73],"Atari":[75],"2600":[76],"games":[77,155],"using":[78],"implemented":[81],"FPGAs.":[84],"Combined":[85],"hardware":[86],"implementation":[87,160],"console,":[91],"image":[92],"preprocessing":[93],"network":[97,140],"in":[98,136,151],"an":[99],"optimized":[100],"pipeline,":[101],"multiplied":[102],"system":[105,128],"level":[106],"parallelism":[107],"enabled":[108],"acceleration.":[110],"These":[111],"are":[113],"first":[115],"application":[116],"demonstration":[117],"IBM":[120],"Neural":[121],"Computer,":[122],"which":[123],"is":[124],"custom":[126],"designed":[127],"that":[129],"consists":[130],"432":[132],"Xilinx":[133],"FPGAs":[134],"interconnected":[135],"3D":[138],"mesh":[139],"topology.":[141],"In":[142],"addition":[143],"to":[144,157],"high":[145],"performance,":[146],"experiments":[147],"also":[148],"showed":[149],"improvement":[150],"accuracy":[152],"all":[154],"compared":[156],"same":[163],"algorithm.":[164]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2}],"updated_date":"2026-06-13T07:54:00.901334","created_date":"2020-05-13T00:00:00"}
