{"id":"https://openalex.org/W4405787242","doi":"https://doi.org/10.1109/iros58592.2024.10801717","title":"Adaptive Trajectory Database Learning for Nonlinear Control with Hybrid Gradient Optimization","display_name":"Adaptive Trajectory Database Learning for Nonlinear Control with Hybrid Gradient Optimization","publication_year":2024,"publication_date":"2024-10-14","ids":{"openalex":"https://openalex.org/W4405787242","doi":"https://doi.org/10.1109/iros58592.2024.10801717"},"language":"en","primary_location":{"id":"doi:10.1109/iros58592.2024.10801717","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801717","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108819707","display_name":"Kuan-Yu Tseng","orcid":"https://orcid.org/0009-0004-4396-6056"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Kuan-Yu Tseng","raw_affiliation_strings":["University of Illinois at Urbana&#x2013;Champaign,Department of Mechanical Science and Engineering,Urbana,IL,USA,61801"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana&#x2013;Champaign,Department of Mechanical Science and Engineering,Urbana,IL,USA,61801","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065273077","display_name":"Mengchao Zhang","orcid":"https://orcid.org/0000-0003-4417-7775"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mengchao Zhang","raw_affiliation_strings":["University of Illinois at Urbana&#x2013;Champaign,Department of Mechanical Science and Engineering,Urbana,IL,USA,61801"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana&#x2013;Champaign,Department of Mechanical Science and Engineering,Urbana,IL,USA,61801","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027878263","display_name":"Kris Hauser","orcid":"https://orcid.org/0000-0002-5207-1527"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kris Hauser","raw_affiliation_strings":["University of Illinois at Urbana-Champaign,Department of Computer Science,Urbana,IL,USA,61801"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign,Department of Computer Science,Urbana,IL,USA,61801","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061952552","display_name":"Geir E. Dullerud","orcid":"https://orcid.org/0000-0003-0596-6050"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Geir E. Dullerud","raw_affiliation_strings":["University of Illinois at Urbana&#x2013;Champaign,Department of Mechanical Science and Engineering,Urbana,IL,USA,61801"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana&#x2013;Champaign,Department of Mechanical Science and Engineering,Urbana,IL,USA,61801","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5108819707"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":0.3488,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.63510186,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"11969","last_page":"11976"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9822999835014343,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9822999835014343,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9810000061988831,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10040","display_name":"Adaptive Control of Nonlinear Systems","score":0.970300018787384,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.7220889329910278},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6822862029075623},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.5859419703483582},{"id":"https://openalex.org/keywords/adaptive-control","display_name":"Adaptive control","score":0.5155196189880371},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.48815256357192993},{"id":"https://openalex.org/keywords/trajectory-optimization","display_name":"Trajectory optimization","score":0.4348348379135132},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.3732123374938965},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3352607488632202},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.09937286376953125}],"concepts":[{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.7220889329910278},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6822862029075623},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.5859419703483582},{"id":"https://openalex.org/C107464732","wikidata":"https://www.wikidata.org/wiki/Q235781","display_name":"Adaptive control","level":3,"score":0.5155196189880371},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.48815256357192993},{"id":"https://openalex.org/C173246807","wikidata":"https://www.wikidata.org/wiki/Q7833062","display_name":"Trajectory optimization","level":3,"score":0.4348348379135132},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3732123374938965},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3352607488632202},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.09937286376953125},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros58592.2024.10801717","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801717","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1591375184","https://openalex.org/W2000803795","https://openalex.org/W2041242313","https://openalex.org/W2560647685","https://openalex.org/W2605102758","https://openalex.org/W2619551236","https://openalex.org/W2767050701","https://openalex.org/W2911087563","https://openalex.org/W2963614114","https://openalex.org/W2968116426","https://openalex.org/W2973229164","https://openalex.org/W2989394062","https://openalex.org/W2998974207","https://openalex.org/W3015222299","https://openalex.org/W3088310808","https://openalex.org/W3205950063","https://openalex.org/W3206938627","https://openalex.org/W4210880854","https://openalex.org/W4295855158","https://openalex.org/W6728925229","https://openalex.org/W6741002519","https://openalex.org/W6746684068","https://openalex.org/W6747473740","https://openalex.org/W6797024940","https://openalex.org/W6804601995"],"related_works":["https://openalex.org/W4385832323","https://openalex.org/W4244391535","https://openalex.org/W2356996864","https://openalex.org/W2904060783","https://openalex.org/W2015393961","https://openalex.org/W2378339670","https://openalex.org/W2359353485","https://openalex.org/W2361427670","https://openalex.org/W2139910871","https://openalex.org/W2119925415"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,29,37,66,104,109,126,134,157],"novel":[4],"experience-based":[5],"technique,":[6,70],"called":[7],"EHGO,":[8],"for":[9,26],"sample-efficient":[10],"adaptive":[11],"control":[12,86],"of":[13,19,40,93,137,201,203,210],"nonlinear":[14],"systems":[15,170],"in":[16,58,103,107,141],"the":[17,47,59,80,85,94,176,186],"presence":[18],"dynamical":[20,169],"modeling":[21],"errors.":[22,191],"The":[23,62,144],"starting":[24],"point":[25],"EHGO":[27,195],"is":[28,146],"database":[30,127,145],"seeded":[31],"with":[32],"many":[33],"trajectories":[34,51,75],"optimized":[35],"under":[36],"reference":[38,60,81,187],"estimate":[39],"real":[41,48,95,204],"system":[42],"dynamics.":[43,61],"When":[44],"executed":[45,74],"on":[46,167],"system,":[49],"these":[50,193],"will":[52],"be":[53,208],"suboptimal":[54],"due":[55],"to":[56,83,124,128,131,148,161,181],"errors":[57],"approach":[63,178],"then":[64],"leverages":[65],"hybrid":[67],"gradient":[68],"optimization":[69],"GRILC,":[71],"which":[72,108,206],"observes":[73],"and":[76,154],"computes":[77],"gradients":[78],"from":[79,114],"model":[82,92,188],"refine":[84],"policy":[87],"without":[88],"requiring":[89],"an":[90],"explicit":[91],"system.":[96],"In":[97,118,192],"past":[98],"work,":[99],"GRILC":[100,130],"was":[101],"applied":[102],"restrictive":[105],"setting":[106],"robot":[110],"executes":[111],"multiple":[112],"rollouts":[113],"identical":[115],"start":[116,139,151],"states.":[117],"this":[119],"paper,":[120],"we":[121],"show":[122,174],"how":[123],"leverage":[125],"enable":[129],"operate":[132],"across":[133],"wide":[135],"envelope":[136],"possible":[138],"states":[140],"different":[142],"iterations.":[143],"used":[147],"balance":[149],"between":[150],"state":[152],"proximity":[153],"recentness-of-experience":[155],"via":[156],"learned":[158],"distance":[159],"metric":[160],"generate":[162],"good":[163],"initial":[164],"guesses.":[165],"Experiments":[166],"three":[168],"(pendulum,":[171],"car,":[172],"drone)":[173],"that":[175],"proposed":[177],"adapts":[179],"quickly":[180],"online":[182],"experience":[183],"even":[184],"when":[185],"has":[189],"significant":[190],"examples":[194],"generates":[196],"near-optimal":[197],"solutions":[198],"within":[199],"hundreds":[200],"epochs":[202],"execution,":[205],"can":[207],"orders":[209],"magnitude":[211],"more":[212],"sample":[213],"efficient":[214],"than":[215],"reinforcement":[216],"learning":[217],"techniques.":[218]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
