{"id":"https://openalex.org/W4410584314","doi":"https://doi.org/10.23919/date64628.2025.10992886","title":"PEARL: FPGA-Based Reinforcement Learning Acceleration with Pipelined Parallel Environments","display_name":"PEARL: FPGA-Based Reinforcement Learning Acceleration with Pipelined Parallel Environments","publication_year":2025,"publication_date":"2025-03-31","ids":{"openalex":"https://openalex.org/W4410584314","doi":"https://doi.org/10.23919/date64628.2025.10992886"},"language":"en","primary_location":{"id":"doi:10.23919/date64628.2025.10992886","is_oa":false,"landing_page_url":"https://doi.org/10.23919/date64628.2025.10992886","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Design, Automation &amp;amp; Test in Europe Conference (DATE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100446495","display_name":"Jiayi Li","orcid":"https://orcid.org/0009-0006-6523-1952"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiayi Li","raw_affiliation_strings":["Institute for Artificial Intelligence, Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute for Artificial Intelligence, Peking University,Beijing,China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053355595","display_name":"H. Vicky Zhao","orcid":"https://orcid.org/0000-0002-3690-9924"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongxiao Zhao","raw_affiliation_strings":["Institute for Artificial Intelligence, Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute for Artificial Intelligence, Peking University,Beijing,China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070362924","display_name":"Wenshuo Yue","orcid":"https://orcid.org/0000-0002-4339-0489"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenshuo Yue","raw_affiliation_strings":["Institute for Artificial Intelligence, Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute for Artificial Intelligence, Peking University,Beijing,China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111088901","display_name":"Yihan Fu","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yihan Fu","raw_affiliation_strings":["Institute for Artificial Intelligence, Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute for Artificial Intelligence, Peking University,Beijing,China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101228787","display_name":"Daijing Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Daijing Shi","raw_affiliation_strings":["Institute for Artificial Intelligence, Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute for Artificial Intelligence, Peking University,Beijing,China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034445385","display_name":"Anjunyi Fan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Anjunyi Fan","raw_affiliation_strings":["Institute for Artificial Intelligence, Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute for Artificial Intelligence, Peking University,Beijing,China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057584787","display_name":"Yuchao Yang","orcid":"https://orcid.org/0000-0003-4674-4059"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuchao Yang","raw_affiliation_strings":["Institute for Artificial Intelligence, Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute for Artificial Intelligence, Peking University,Beijing,China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043075091","display_name":"Bonan Yan","orcid":"https://orcid.org/0000-0002-3052-9330"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bonan Yan","raw_affiliation_strings":["Institute for Artificial Intelligence, Peking University,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute for Artificial Intelligence, Peking University,Beijing,China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100446495"],"corresponding_institution_ids":["https://openalex.org/I20231570","https://openalex.org/I4210100255"],"apc_list":null,"apc_paid":null,"fwci":1.4856,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.82891018,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11522","display_name":"VLSI and FPGA Design Techniques","score":0.9488000273704529,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11522","display_name":"VLSI and FPGA Design Techniques","score":0.9488000273704529,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9380000233650208,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9143999814987183,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8053832650184631},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7297972440719604},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.727411150932312},{"id":"https://openalex.org/keywords/acceleration","display_name":"Acceleration","score":0.7142235040664673},{"id":"https://openalex.org/keywords/pearl","display_name":"Pearl","score":0.656151533126831},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.41891953349113464},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.32885581254959106},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.26617488265037537},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.26318830251693726}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8053832650184631},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7297972440719604},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.727411150932312},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.7142235040664673},{"id":"https://openalex.org/C2779251273","wikidata":"https://www.wikidata.org/wiki/Q43436","display_name":"Pearl","level":2,"score":0.656151533126831},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.41891953349113464},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.32885581254959106},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26617488265037537},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.26318830251693726},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C27206212","wikidata":"https://www.wikidata.org/wiki/Q34178","display_name":"Theology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/date64628.2025.10992886","is_oa":false,"landing_page_url":"https://doi.org/10.23919/date64628.2025.10992886","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Design, Automation &amp;amp; Test in Europe Conference (DATE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W1891233321","https://openalex.org/W2052924095","https://openalex.org/W2091565802","https://openalex.org/W2121517924","https://openalex.org/W2128022558","https://openalex.org/W2142677441","https://openalex.org/W2150468603","https://openalex.org/W2762946676","https://openalex.org/W2766447205","https://openalex.org/W2788862220","https://openalex.org/W2798919674","https://openalex.org/W2931767035","https://openalex.org/W2952789476","https://openalex.org/W2985670337","https://openalex.org/W3035681682","https://openalex.org/W3035864994","https://openalex.org/W3036033155","https://openalex.org/W3111884232","https://openalex.org/W3128973049","https://openalex.org/W3147018723","https://openalex.org/W3213742958","https://openalex.org/W4214717370","https://openalex.org/W4229017035","https://openalex.org/W4255138242","https://openalex.org/W4302493448","https://openalex.org/W4312121009","https://openalex.org/W4321637127","https://openalex.org/W4379115908","https://openalex.org/W4391429126","https://openalex.org/W4401018608","https://openalex.org/W4401568624","https://openalex.org/W4402196955","https://openalex.org/W6635902665","https://openalex.org/W6780153092","https://openalex.org/W6839361920","https://openalex.org/W6855101350","https://openalex.org/W6857395904"],"related_works":["https://openalex.org/W4398771981","https://openalex.org/W4297824900","https://openalex.org/W2186798288","https://openalex.org/W2950290350","https://openalex.org/W761508262","https://openalex.org/W1507226244","https://openalex.org/W4248123049","https://openalex.org/W1967938402","https://openalex.org/W2386041993","https://openalex.org/W1608572506"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,7],"(RL)":[2],"is":[3,46,224],"an":[4,25,196],"effective":[5],"machine":[6],"approach":[8],"that":[9],"enables":[10],"artificial":[11],"intelligence":[12],"agents":[13,57],"to":[14,35,101,121,143,183,201],"perform":[15],"complex":[16],"tasks":[17],"and":[18,58,92,117,158,165,174,185,203,214],"make":[19],"decisions":[20],"in":[21,146,177],"dynamic":[22],"situations.":[23],"Training":[24],"RL":[26,63,84,115,212],"agent":[27],"demands":[28],"its":[29],"repetitive":[30],"interaction":[31],"with":[32,95,209],"the":[33,107,126,137,149,190,210,221],"environment":[34,133],"learn":[36],"optimal":[37],"policies.":[38],"To":[39,75],"efficiently":[40],"collect":[41],"training":[42,218],"data,":[43],"parallelizing":[44],"environments":[45,91,116,140,188],"a":[47,67,81,96],"widely":[48],"used":[49],"technique":[50],"by":[51,154,162],"enabling":[52],"simultaneous":[53],"interactions":[54],"between":[55],"multiple":[56,89],"environments.":[59],"However,":[60],"existing":[61,127,211],"CPU-based":[62],"software":[64],"frameworks":[65],"face":[66],"key":[68],"challenge":[69],"of":[70,139],"slow":[71],"multi-environmental":[72],"update":[73],"computation.":[74],"solve":[76],"this":[77],"problem,":[78],"we":[79],"present":[80],"novel":[82],"FPGA-based":[83],"accelerating":[85],"framework-PEARL.":[86],"PEARL":[87,112,180,208],"instantiates":[88],"parallel":[90,132],"accelerates":[93],"them":[94],"carefully":[97],"designed":[98],"pipeline":[99],"scheme":[100],"hide":[102],"data":[103],"transfer":[104],"latency":[105],"within":[106,189],"computation":[108],"time.":[109,219],"We":[110,193,205],"evaluate":[111],"on":[113],"respective":[114],"achieve":[118],"4.36":[119],"x":[120,123,164],"972.6":[122],"speedup":[124],"over":[125],"fastest":[128],"software-based":[129],"framework":[130,191],"for":[131,199],"execution.":[134],"When":[135],"scaling":[136],"number":[138],"from":[141],"1024":[142],"43008":[144],"(42x)":[145],"CliffWalking":[147],"benchmark,":[148],"power":[150,175],"consumption":[151],"increases":[152],"marginally":[153],"3%,":[155],"while":[156],"LUT":[157],"flip-flops":[159],"utilization":[160],"rise":[161],"2.24":[163],"3.08":[166],"x,":[167],"respectively.":[168],"This":[169],"demonstrates":[170],"efficient":[171],"resource":[172],"usage":[173],"management":[176],"PEARL.":[178],"Further,":[179],"allows":[181],"users":[182,200],"define":[184],"add":[186],"their":[187],"flexibly.":[192],"have":[194],"established":[195],"open-source":[197],"repository":[198],"utilize":[202],"expand.":[204],"also":[206],"implement":[207],"algorithm":[213],"save":[215],"7%":[216],"-15%":[217],"All":[220],"source":[222],"code":[223],"available":[225],"online":[226],"https://github.com/Selinaee/FPGA_Gym.":[227]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
