{"id":"https://openalex.org/W4412722185","doi":"https://doi.org/10.1109/tie.2025.3587123","title":"Reinforcement Learning-Based Control for Electrohydraulic Actuators: A Case Study on an Inverted Pendulum Testbench","display_name":"Reinforcement Learning-Based Control for Electrohydraulic Actuators: A Case Study on an Inverted Pendulum Testbench","publication_year":2025,"publication_date":"2025-07-29","ids":{"openalex":"https://openalex.org/W4412722185","doi":"https://doi.org/10.1109/tie.2025.3587123"},"language":"en","primary_location":{"id":"doi:10.1109/tie.2025.3587123","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tie.2025.3587123","pdf_url":null,"source":{"id":"https://openalex.org/S58031724","display_name":"IEEE Transactions on Industrial Electronics","issn_l":"0278-0046","issn":["0278-0046","1557-9948"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Industrial Electronics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000915116","display_name":"Bobo Helian","orcid":"https://orcid.org/0000-0003-2484-5676"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Bobo Helian","raw_affiliation_strings":["Institute of Mobile Machines, Karlsruhe Institute of Technology, Karlsruhe, Germany"],"raw_orcid":"https://orcid.org/0000-0003-2484-5676","affiliations":[{"raw_affiliation_string":"Institute of Mobile Machines, Karlsruhe Institute of Technology, Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Gabriel Schmitt","orcid":"https://orcid.org/0009-0006-6584-7829"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Gabriel Schmitt","raw_affiliation_strings":["Institute of Mobile Machines, Karlsruhe Institute of Technology, Karlsruhe, Germany"],"raw_orcid":"https://orcid.org/0009-0006-6584-7829","affiliations":[{"raw_affiliation_string":"Institute of Mobile Machines, Karlsruhe Institute of Technology, Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041083431","display_name":"Meng Yang","orcid":"https://orcid.org/0000-0002-1272-4757"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meng Yang","raw_affiliation_strings":["School of Mechanical Engineering, Tongji University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-1272-4757","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102784295","display_name":"Yongming Bian","orcid":"https://orcid.org/0000-0002-7086-7529"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongming Bian","raw_affiliation_strings":["School of Mechanical Engineering, Tongji University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-7086-7529","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066152834","display_name":"Marcus Geimer","orcid":"https://orcid.org/0000-0002-9911-9292"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Marcus Geimer","raw_affiliation_strings":["Institute of Mobile Machines, Karlsruhe Institute of Technology, Karlsruhe, Germany"],"raw_orcid":"https://orcid.org/0000-0002-9911-9292","affiliations":[{"raw_affiliation_string":"Institute of Mobile Machines, Karlsruhe Institute of Technology, Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5000915116"],"corresponding_institution_ids":["https://openalex.org/I102335020"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.17143974,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"72","issue":"12","first_page":"14700","last_page":"14711"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11372","display_name":"Hydraulic and Pneumatic Systems","score":0.9883000254631042,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11372","display_name":"Hydraulic and Pneumatic Systems","score":0.9883000254631042,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.9689000248908997,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inverted-pendulum","display_name":"Inverted pendulum","score":0.8879846334457397},{"id":"https://openalex.org/keywords/actuator","display_name":"Actuator","score":0.7897641658782959},{"id":"https://openalex.org/keywords/double-inverted-pendulum","display_name":"Double inverted pendulum","score":0.5998942255973816},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.5695342421531677},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5386255979537964},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5182737708091736},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.48676538467407227},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.3910098373889923},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.37180885672569275},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.31896913051605225},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.25302988290786743},{"id":"https://openalex.org/keywords/structural-engineering","display_name":"Structural engineering","score":0.23983150720596313},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.22850602865219116},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.21573743224143982}],"concepts":[{"id":"https://openalex.org/C192921069","wikidata":"https://www.wikidata.org/wiki/Q550134","display_name":"Inverted pendulum","level":3,"score":0.8879846334457397},{"id":"https://openalex.org/C172707124","wikidata":"https://www.wikidata.org/wiki/Q423488","display_name":"Actuator","level":2,"score":0.7897641658782959},{"id":"https://openalex.org/C102540577","wikidata":"https://www.wikidata.org/wiki/Q5300047","display_name":"Double inverted pendulum","level":4,"score":0.5998942255973816},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.5695342421531677},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5386255979537964},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5182737708091736},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.48676538467407227},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3910098373889923},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.37180885672569275},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.31896913051605225},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.25302988290786743},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.23983150720596313},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.22850602865219116},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.21573743224143982},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tie.2025.3587123","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tie.2025.3587123","pdf_url":null,"source":{"id":"https://openalex.org/S58031724","display_name":"IEEE Transactions on Industrial Electronics","issn_l":"0278-0046","issn":["0278-0046","1557-9948"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Industrial Electronics","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.6700000166893005,"id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G1381731577","display_name":null,"funder_award_id":"52205279","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W2026661001","https://openalex.org/W2041521369","https://openalex.org/W2057155285","https://openalex.org/W2146416655","https://openalex.org/W2160989584","https://openalex.org/W2172067033","https://openalex.org/W2577509550","https://openalex.org/W2607112850","https://openalex.org/W2909588145","https://openalex.org/W2921325762","https://openalex.org/W2981623093","https://openalex.org/W3007490974","https://openalex.org/W3008052590","https://openalex.org/W3044529009","https://openalex.org/W4212932854","https://openalex.org/W4246874178","https://openalex.org/W4252374998","https://openalex.org/W4285197906","https://openalex.org/W4311885910","https://openalex.org/W4312644097","https://openalex.org/W4367663453","https://openalex.org/W4367835918","https://openalex.org/W4379881949","https://openalex.org/W4388741154","https://openalex.org/W4398226126"],"related_works":["https://openalex.org/W2041698009","https://openalex.org/W2024927487","https://openalex.org/W1492838287","https://openalex.org/W2034778971","https://openalex.org/W2349578589","https://openalex.org/W2893549521","https://openalex.org/W2204278379","https://openalex.org/W2381121570","https://openalex.org/W2379721524","https://openalex.org/W2341932412"],"abstract_inverted_index":{"Electrohydraulic":[0],"actuators":[1],"(EHAs)":[2],"are":[3],"critical":[4],"in":[5,88,138],"applications":[6],"demanding":[7],"compact":[8],"designs,":[9],"high":[10],"power":[11],"density,":[12],"and":[13,21,46,78,94,114,119,130,144],"precise":[14],"motion":[15,140],"control.":[16,121],"However,":[17],"their":[18],"nonlinear":[19,77],"dynamics":[20],"inherent":[22],"uncertainties":[23],"pose":[24],"considerable":[25],"control":[26,35,118,141],"challenges.":[27],"This":[28,122],"study":[29,123],"develops":[30],"a":[31,47,66,73,101],"reinforcement":[32],"learning":[33],"(RL)-based":[34],"framework,":[36],"integrating":[37],"an":[38],"actor\u2013critic":[39],"algorithm":[40],"[deep":[41],"deterministic":[42],"policy":[43],"gradient":[44],"(DDPG)]":[45],"novel":[48],"reward-shaping":[49],"method":[50],"to":[51,133],"address":[52],"these":[53],"challenges":[54],"without":[55],"requiring":[56],"prior":[57],"expert":[58],"knowledge.":[59],"The":[60],"proposed":[61],"approach":[62],"is":[63],"validated":[64],"on":[65],"heavy-duty":[67],"EHA-driven":[68,98],"inverted":[69],"pendulum":[70],"testbench,":[71],"as":[72,125],"benchmark":[74],"system":[75],"for":[76,142],"unstable":[79],"dynamics.":[80],"Experimental":[81],"results":[82],"demonstrate":[83],"the":[84,90,97,105,112,134],"RL":[85,137],"controller\u2019s":[86],"effectiveness":[87],"achieving":[89],"dual-control":[91],"goal:":[92],"swing-up":[93],"balancing":[95],"of":[96,136],"pendulum.":[99],"Furthermore,":[100],"comparative":[102],"analysis":[103],"with":[104],"classical":[106],"linear":[107],"quadratic":[108],"regulator":[109],"(LQR)":[110],"highlights":[111],"strengths":[113],"limitations":[115],"between":[116],"RL-based":[117],"model-based":[120],"serves":[124],"fundamental":[126],"research,":[127],"offering":[128],"practical":[129],"theoretical":[131],"contributions":[132],"application":[135],"advanced":[139],"EHAs":[143],"other":[145],"complex":[146],"systems.":[147]},"counts_by_year":[],"updated_date":"2025-12-06T23:10:59.065948","created_date":"2025-10-10T00:00:00"}
