{"id":"https://openalex.org/W4391308420","doi":"https://doi.org/10.1109/smc53992.2023.10394648","title":"ReACT: Reinforcement Learning for Controller Parametrization Using B-Spline Geometries","display_name":"ReACT: Reinforcement Learning for Controller Parametrization Using B-Spline Geometries","publication_year":2023,"publication_date":"2023-10-01","ids":{"openalex":"https://openalex.org/W4391308420","doi":"https://doi.org/10.1109/smc53992.2023.10394648"},"language":"en","primary_location":{"id":"doi:10.1109/smc53992.2023.10394648","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc53992.2023.10394648","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024092512","display_name":"Thomas Rudolf","orcid":"https://orcid.org/0000-0002-6020-2611"},"institutions":[{"id":"https://openalex.org/I143379178","display_name":"FZI Research Center for Information Technology","ror":"https://ror.org/04kdh6x72","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I143379178"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Thomas Rudolf","raw_affiliation_strings":["FZI Research Center for Information Technology,Embedded Systems and Sensors Engineering department,Karlsruhe,Germany,76131"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"FZI Research Center for Information Technology,Embedded Systems and Sensors Engineering department,Karlsruhe,Germany,76131","institution_ids":["https://openalex.org/I143379178"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056681387","display_name":"Daniel Fl\u00f6gel","orcid":"https://orcid.org/0009-0005-9899-0616"},"institutions":[{"id":"https://openalex.org/I143379178","display_name":"FZI Research Center for Information Technology","ror":"https://ror.org/04kdh6x72","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I143379178"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Daniel Fl\u00f6gel","raw_affiliation_strings":["FZI Research Center for Information Technology,Embedded Systems and Sensors Engineering department,Karlsruhe,Germany,76131"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"FZI Research Center for Information Technology,Embedded Systems and Sensors Engineering department,Karlsruhe,Germany,76131","institution_ids":["https://openalex.org/I143379178"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019107231","display_name":"Tobias Sch\u00fcrmann","orcid":"https://orcid.org/0000-0002-1967-7076"},"institutions":[{"id":"https://openalex.org/I143379178","display_name":"FZI Research Center for Information Technology","ror":"https://ror.org/04kdh6x72","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I143379178"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Tobias Sch\u00fcrmann","raw_affiliation_strings":["FZI Research Center for Information Technology,Embedded Systems and Sensors Engineering department,Karlsruhe,Germany,76131"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"FZI Research Center for Information Technology,Embedded Systems and Sensors Engineering department,Karlsruhe,Germany,76131","institution_ids":["https://openalex.org/I143379178"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093711469","display_name":"Simon S\u00fc\u00df","orcid":null},"institutions":[{"id":"https://openalex.org/I143379178","display_name":"FZI Research Center for Information Technology","ror":"https://ror.org/04kdh6x72","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I143379178"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Simon S\u00fc\u00df","raw_affiliation_strings":["FZI Research Center for Information Technology,Embedded Systems and Sensors Engineering department,Karlsruhe,Germany,76131"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"FZI Research Center for Information Technology,Embedded Systems and Sensors Engineering department,Karlsruhe,Germany,76131","institution_ids":["https://openalex.org/I143379178"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090909486","display_name":"Stefan Schwab","orcid":"https://orcid.org/0000-0002-2646-7755"},"institutions":[{"id":"https://openalex.org/I143379178","display_name":"FZI Research Center for Information Technology","ror":"https://ror.org/04kdh6x72","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I143379178"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Stefan Schwab","raw_affiliation_strings":["FZI Research Center for Information Technology,Embedded Systems and Sensors Engineering department,Karlsruhe,Germany,76131"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"FZI Research Center for Information Technology,Embedded Systems and Sensors Engineering department,Karlsruhe,Germany,76131","institution_ids":["https://openalex.org/I143379178"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040502908","display_name":"S\u00f6ren Hohmann","orcid":"https://orcid.org/0000-0002-4170-1431"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"S\u00f6ren Hohmann","raw_affiliation_strings":["Institute of Control Systems of the Karlsruhe Institute of Technology,Karlsruhe,Germany,76131"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Control Systems of the Karlsruhe Institute of Technology,Karlsruhe,Germany,76131","institution_ids":["https://openalex.org/I102335020"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3107,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.56484234,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"3385","last_page":"3391"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14083","display_name":"Extremum Seeking Control Systems","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6735451221466064},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6654156446456909},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.5310611724853516},{"id":"https://openalex.org/keywords/parametrization","display_name":"Parametrization (atmospheric modeling)","score":0.48116931319236755},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.4010918140411377},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3858891427516937},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.37701213359832764},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.15120837092399597},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.146755188703537}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6735451221466064},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6654156446456909},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.5310611724853516},{"id":"https://openalex.org/C202887219","wikidata":"https://www.wikidata.org/wiki/Q3895221","display_name":"Parametrization (atmospheric modeling)","level":3,"score":0.48116931319236755},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.4010918140411377},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3858891427516937},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.37701213359832764},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.15120837092399597},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.146755188703537},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C74902906","wikidata":"https://www.wikidata.org/wiki/Q1190858","display_name":"Radiative transfer","level":2,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/smc53992.2023.10394648","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc53992.2023.10394648","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1534177433","https://openalex.org/W1587477963","https://openalex.org/W2038730444","https://openalex.org/W2893573014","https://openalex.org/W2913668833","https://openalex.org/W2982381122","https://openalex.org/W3006583102","https://openalex.org/W3200445772","https://openalex.org/W3216772467","https://openalex.org/W4220737776","https://openalex.org/W4221155677","https://openalex.org/W4296167810","https://openalex.org/W4310969904","https://openalex.org/W6747473740","https://openalex.org/W6776730770","https://openalex.org/W6802202268","https://openalex.org/W6804601995"],"related_works":["https://openalex.org/W2153421756","https://openalex.org/W2054489697","https://openalex.org/W2077818434","https://openalex.org/W2361081803","https://openalex.org/W2036241269","https://openalex.org/W2109057766","https://openalex.org/W4250375811","https://openalex.org/W2078644396","https://openalex.org/W2026930022","https://openalex.org/W2000675896"],"abstract_inverted_index":{"Robust":[0],"and":[1,15,20,139,179,195,199],"performant":[2],"controllers":[3],"are":[4,71,161],"essential":[5],"for":[6,13],"industrial":[7,210],"applications.":[8],"However,":[9],"deriving":[10],"controller":[11,25,86,111,126],"parameters":[12,127],"complex":[14,56],"nonlinear":[16],"systems":[17,54],"is":[18],"challenging":[19],"time-consuming.":[21],"To":[22,135,189],"facilitate":[23],"automatic":[24],"parametrization,":[26],"this":[27,65,155],"work":[28,156],"presents":[29],"a":[30,51,141,147],"novel":[31],"approach":[32],"using":[33],"deep":[34],"reinforcement":[35],"learning":[36],"(DRL)":[37],"with":[38,55,213],"N-dimensional":[39],"B-spline":[40],"geometries":[41],"(BSGs).":[42],"We":[43,113],"focus":[44],"on":[45,60,99,131,204],"the":[46,61,84,103,110,115,125,177,183,201,205],"control":[47,69,91,100,211],"of":[48,53,182,208],"parameter-variant":[49],"systems,":[50],"class":[52],"behavior":[57],"which":[58,128,166],"depends":[59],"operating":[62,133],"conditions.":[63,134],"For":[64],"system":[66,101],"class,":[67],"gain-scheduling":[68],"structures":[70],"widely":[72],"used":[73],"in":[74],"applications":[75],"across":[76],"industries":[77],"due":[78],"to":[79,108,123,163,176],"well-known":[80],"design":[81],"principles.":[82],"Facilitating":[83],"expensive":[85],"parametrization":[87,206],"task":[88,207],"regarding":[89],"these":[90],"structures,":[92],"we":[93,145,171,197],"deploy":[94],"an":[95,209],"DRL":[96,202],"agent.":[97],"Based":[98],"observations,":[102],"agent":[104,203],"autonomously":[105],"decides":[106],"how":[107],"adapt":[109],"parameters.":[112],"make":[114],"adaptation":[116],"process":[117],"more":[118],"efficient":[119],"by":[120],"introducing":[121],"BSGs":[122],"map":[124],"may":[129],"depend":[130],"numerous":[132],"preprocess":[136],"time-series":[137],"data":[138],"extract":[140],"fixed-length":[142],"feature":[143],"vector,":[144],"use":[146],"long":[148],"short-term":[149],"memory":[150],"(LSTM)":[151],"neural":[152],"networks.":[153],"Furthermore,":[154],"contributes":[157],"actor":[158,178],"regularizations":[159],"that":[160],"relevant":[162],"real-world":[164],"environments":[165],"differ":[167],"from":[168],"training.":[169],"Accordingly,":[170],"apply":[172],"dropout":[173],"layer":[174],"normalization":[175],"critic":[180,186],"networks":[181],"truncated":[184],"quantile":[185],"(TQC)":[187],"algorithm.":[188],"show":[190],"our":[191],"approach's":[192],"working":[193],"principle":[194],"effectiveness,":[196],"train":[198],"evaluate":[200],"structure":[212],"parameter":[214],"lookup":[215],"tables.":[216]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
