{"id":"https://openalex.org/W4413393300","doi":"https://doi.org/10.23919/acc63710.2025.11107675","title":"Learning Effective and Generalizable Controller via Zeroth-order Gradient Estimation","display_name":"Learning Effective and Generalizable Controller via Zeroth-order Gradient Estimation","publication_year":2025,"publication_date":"2025-07-08","ids":{"openalex":"https://openalex.org/W4413393300","doi":"https://doi.org/10.23919/acc63710.2025.11107675"},"language":"en","primary_location":{"id":"doi:10.23919/acc63710.2025.11107675","is_oa":false,"landing_page_url":"https://doi.org/10.23919/acc63710.2025.11107675","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 American Control Conference (ACC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034632701","display_name":"Chaodong Li","orcid":"https://orcid.org/0000-0003-4714-9569"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chaodong Li","raw_affiliation_strings":["Tongji University,Department of Control Science and Engineering,Shanghai,China,201804"],"affiliations":[{"raw_affiliation_string":"Tongji University,Department of Control Science and Engineering,Shanghai,China,201804","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089663996","display_name":"Peng Yi","orcid":"https://orcid.org/0000-0002-2494-1505"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Yi","raw_affiliation_strings":["Tongji University,Department of Control Science and Engineering,Shanghai,China,201804"],"affiliations":[{"raw_affiliation_string":"Tongji University,Department of Control Science and Engineering,Shanghai,China,201804","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116337554","display_name":"Wenting Liu","orcid":"https://orcid.org/0000-0001-7008-0120"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenting Liu","raw_affiliation_strings":["Tongji University,Department of Control Science and Engineering,Shanghai,China,201804"],"affiliations":[{"raw_affiliation_string":"Tongji University,Department of Control Science and Engineering,Shanghai,China,201804","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025654724","display_name":"Di Zhao","orcid":"https://orcid.org/0000-0003-2508-9163"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Di Zhao","raw_affiliation_strings":["Tongji University,Department of Control Science and Engineering,Shanghai,China,201804"],"affiliations":[{"raw_affiliation_string":"Tongji University,Department of Control Science and Engineering,Shanghai,China,201804","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080997906","display_name":"Wenyan Bai","orcid":"https://orcid.org/0000-0002-3192-3516"},"institutions":[{"id":"https://openalex.org/I4210166468","display_name":"Beijing Aerospace Flight Control Center","ror":"https://ror.org/007a14354","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210166468"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenyan Bai","raw_affiliation_strings":["Beijing Aerospace Automatic Control Institute,Beijing,China,100854"],"affiliations":[{"raw_affiliation_string":"Beijing Aerospace Automatic Control Institute,Beijing,China,100854","institution_ids":["https://openalex.org/I4210166468"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5034632701"],"corresponding_institution_ids":["https://openalex.org/I116953780"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.32274002,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"166","last_page":"173"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9585000276565552,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9585000276565552,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11236","display_name":"Control Systems and Identification","score":0.9323999881744385,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9228000044822693,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5714884400367737},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.5593048334121704},{"id":"https://openalex.org/keywords/zeroth-law-of-thermodynamics","display_name":"Zeroth law of thermodynamics","score":0.5355809330940247},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.49312278628349304},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4883882403373718},{"id":"https://openalex.org/keywords/order","display_name":"Order (exchange)","score":0.41617390513420105},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.29251575469970703},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.18139317631721497},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.145094633102417},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.1360037922859192}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5714884400367737},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.5593048334121704},{"id":"https://openalex.org/C68755742","wikidata":"https://www.wikidata.org/wiki/Q190983","display_name":"Zeroth law of thermodynamics","level":2,"score":0.5355809330940247},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.49312278628349304},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4883882403373718},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.41617390513420105},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.29251575469970703},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.18139317631721497},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.145094633102417},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.1360037922859192},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/acc63710.2025.11107675","is_oa":false,"landing_page_url":"https://doi.org/10.23919/acc63710.2025.11107675","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 American Control Conference (ACC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320337504","display_name":"Research and Development","ror":"https://ror.org/027s68j25"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1502680304","https://openalex.org/W2009797711","https://openalex.org/W2124289529","https://openalex.org/W2134673975","https://openalex.org/W2889470209","https://openalex.org/W3134723610","https://openalex.org/W3156330606","https://openalex.org/W3185165122","https://openalex.org/W3208705304","https://openalex.org/W4383066094","https://openalex.org/W4389476291","https://openalex.org/W4390938336","https://openalex.org/W4393206865"],"related_works":["https://openalex.org/W2055832495","https://openalex.org/W4297745082","https://openalex.org/W1993876517","https://openalex.org/W1601218205","https://openalex.org/W2793511430","https://openalex.org/W4210561670","https://openalex.org/W2014930628","https://openalex.org/W2007277451","https://openalex.org/W2011273327","https://openalex.org/W1869596295"],"abstract_inverted_index":{"Learning-based":[0],"offline":[1],"training":[2,47,62,97,117,125],"methods":[3],"can":[4],"effectively":[5],"reduce":[6],"the":[7,61,79,89,102,106,130],"computational":[8],"demands":[9],"of":[10],"real-time":[11],"optimization-based":[12],"control.":[13],"However,":[14],"existing":[15],"approaches":[16],"that":[17,71,99],"rely":[18],"on":[19,101],"imitation":[20],"or":[21,31,54],"differentiable":[22,32],"programming":[23],"may":[24],"fail":[25],"if":[26],"a":[27,42,66,74,86,96,111],"well-tuned":[28],"MPC":[29],"controller":[30,81,91,108,151],"plant":[33,113],"dynamics":[34],"are":[35],"unavailable.":[36],"To":[37,59],"address":[38],"this,":[39],"we":[40,64,94,128],"propose":[41,95],"zeroth-order":[43,75],"optimization":[44],"approach":[45],"for":[46,137,165],"neural":[48,90,107],"controllers":[49],"using":[50],"input-output":[51],"prediction":[52],"sequences":[53],"even":[55],"only":[56],"bandit":[57,80],"feedback.":[58],"improve":[60],"efficiency,":[63],"introduce":[65],"mixed":[67],"gradient":[68,76],"computation":[69],"scheme":[70],"first":[72],"applies":[73,85],"estimation":[77],"with":[78,119,143,158],"performance,":[82],"and":[83,110,139,146],"then":[84],"backpropagation":[87],"to":[88,115,169],"network.":[92],"Additionally,":[93],"procedure":[98],"relies":[100],"closed-loop":[103],"interaction":[104],"between":[105],"network":[109],"black-box":[112],"model":[114],"generate":[116],"data":[118],"better":[120],"distribution,":[121],"thereby":[122],"positively":[123],"impacting":[124],"effectiveness.":[126],"Finally,":[127],"evaluate":[129],"proposed":[131],"method":[132],"through":[133],"extensive":[134],"simulation":[135,168],"experiments":[136],"tracking":[138],"stabilization":[140],"control":[141],"tasks":[142],"high-dimensional,":[144],"nonlinear,":[145],"strongly":[147],"coupled":[148],"plants.":[149],"The":[150],"shows":[152],"generalizability":[153],"when":[154],"implemented":[155],"in":[156],"plants":[157],"parameter":[159],"drifts,":[160],"which":[161],"makes":[162],"it":[163],"suitable":[164],"transferring":[166],"from":[167],"real-world":[170],"applications.":[171]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
