{"id":"https://openalex.org/W7130555333","doi":"https://doi.org/10.1109/apccas67402.2025.11376621","title":"Improvement of A2C Training Efficiency with FSM-Based Meta-Optimizer on CPU-FPGA Platform","display_name":"Improvement of A2C Training Efficiency with FSM-Based Meta-Optimizer on CPU-FPGA Platform","publication_year":2025,"publication_date":"2025-10-12","ids":{"openalex":"https://openalex.org/W7130555333","doi":"https://doi.org/10.1109/apccas67402.2025.11376621"},"language":null,"primary_location":{"id":"doi:10.1109/apccas67402.2025.11376621","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apccas67402.2025.11376621","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Asia Pacific Conference on Circuits and Systems (APCCAS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120386279","display_name":"Chavakorn Somjaisuk","orcid":"https://orcid.org/0009-0001-3481-7962"},"institutions":[{"id":"https://openalex.org/I35568498","display_name":"Kochi University of Technology","ror":"https://ror.org/00rghrr56","country_code":"JP","type":"education","lineage":["https://openalex.org/I35568498"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Chavakorn Somjaisuk","raw_affiliation_strings":["Kochi University of Technology,Department of Engineering,Kami,Kochi,Japan,782-8502"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Kochi University of Technology,Department of Engineering,Kami,Kochi,Japan,782-8502","institution_ids":["https://openalex.org/I35568498"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015621925","display_name":"Yukio Mitsuyama","orcid":"https://orcid.org/0000-0001-8151-0085"},"institutions":[{"id":"https://openalex.org/I35568498","display_name":"Kochi University of Technology","ror":"https://ror.org/00rghrr56","country_code":"JP","type":"education","lineage":["https://openalex.org/I35568498"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yukio Mitsuyama","raw_affiliation_strings":["Kochi University of Technology,Department of Engineering,Kami,Kochi,Japan,782-8502"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Kochi University of Technology,Department of Engineering,Kami,Kochi,Japan,782-8502","institution_ids":["https://openalex.org/I35568498"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.81685914,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.11339999735355377,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.11339999735355377,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.08240000158548355,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.07429999858140945,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6105999946594238},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5133000016212463},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.5077999830245972},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.49309998750686646},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.49000000953674316},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.4837999939918518},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.478300005197525},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.44449999928474426},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.4277999997138977}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6269000172615051},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6105999946594238},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5133000016212463},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.5077999830245972},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.49309998750686646},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.49000000953674316},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.4837999939918518},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.478300005197525},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.47530001401901245},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.44449999928474426},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.4277999997138977},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.4253999888896942},{"id":"https://openalex.org/C167822520","wikidata":"https://www.wikidata.org/wiki/Q176452","display_name":"Finite-state machine","level":2,"score":0.4032000005245209},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.3646000027656555},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3612000048160553},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.352400004863739},{"id":"https://openalex.org/C2984118289","wikidata":"https://www.wikidata.org/wiki/Q29954","display_name":"Power consumption","level":3,"score":0.3504999876022339},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.34290000796318054},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.33959999680519104},{"id":"https://openalex.org/C173018170","wikidata":"https://www.wikidata.org/wiki/Q165678","display_name":"Microcontroller","level":2,"score":0.3375999927520752},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.3034000098705292},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.29670000076293945},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.29089999198913574},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2903999984264374},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.28110000491142273},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.2694999873638153},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.2581999897956848},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.25540000200271606}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apccas67402.2025.11376621","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apccas67402.2025.11376621","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Asia Pacific Conference on Circuits and Systems (APCCAS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.9035303592681885,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":3,"referenced_works":["https://openalex.org/W2416799949","https://openalex.org/W2904195769","https://openalex.org/W3035681682"],"related_works":[],"abstract_inverted_index":{"The":[0,63],"demand":[1],"for":[2,168],"intelligent":[3],"edge":[4,172],"devices":[5],"with":[6],"ondevice":[7],"learning":[8,73,176],"is":[9,66],"increasing,":[10],"enabling":[11],"real-time":[12],"adaptation":[13],"without":[14],"reliance":[15],"on":[16,30,76,81,129],"the":[17,82,85,134,179],"cloud.":[18],"However,":[19],"deploying":[20],"Deep":[21],"Reinforcement":[22],"Learning":[23],"(DRL)":[24],"algorithms":[25],"like":[26],"Advantage":[27],"ActorCritic":[28],"(A2C)":[29],"such":[31],"platforms":[32],"remains":[33],"challenging":[34],"due":[35],"to":[36,59,98,124],"slow":[37],"convergence":[38,93],"and":[39,88,147,161],"high":[40],"power":[41],"consumption.":[42],"This":[43,111,156],"work":[44],"presents":[45],"an":[46,130],"A2C":[47,87],"system":[48,91],"enhanced":[49],"by":[50,102,118],"a":[51,67,103,165],"hardware-friendly":[52],"Finite":[53],"State":[54],"Machine":[55],"(FSM)":[56],"based":[57,75],"meta-optimizer":[58,90],"improve":[60],"training":[61,113,160],"efficiency.":[62,155],"system's":[64],"core":[65],"lightweight":[68],"FSM":[69,135],"that":[70],"adaptively":[71],"tunes":[72],"rates":[74],"reward":[77],"trend":[78],"analysis.":[79],"Evaluated":[80],"CartPole-v1":[83],"benchmark,":[84],"integrated":[86],"FSM-based":[89],"enables":[92],"in":[94,178],"513":[95],"episodes,":[96],"compared":[97],"758":[99],"episodes":[100],"required":[101],"baseline":[104],"A2C,":[105],"achieving":[106],"32.3":[107],"%":[108,120,140,144,149],"faster":[109],"convergence.":[110],"accelerated":[112,159],"reduces":[114],"total":[115],"energy":[116],"consumption":[117],"58.6":[119],"(from":[121],"915.2":[122],"kJ":[123],"378.81":[125],"kJ).":[126],"Post-synthesis":[127],"results":[128],"Ultra96-V2":[131],"FPGA":[132],"show":[133],"controller":[136],"consumes":[137],"only":[138],"7":[139],"of":[141,145,150,158,175],"LUTs,":[142],"6":[143],"DSPs,":[146],"5":[148],"FFs,":[151],"confirming":[152],"its":[153],"hardware":[154],"combination":[157],"minimal":[162],"overhead":[163],"demonstrates":[164],"compelling":[166],"approach":[167],"developing":[169],"low-power,":[170],"self-improving":[171],"systems":[173],"capable":[174],"directly":[177],"field.":[180]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-20T00:00:00"}
