{"id":"https://openalex.org/W4400877505","doi":"https://doi.org/10.1109/tase.2024.3427657","title":"Model-Free Inverse H-Infinity Control for Imitation Learning","display_name":"Model-Free Inverse H-Infinity Control for Imitation Learning","publication_year":2024,"publication_date":"2024-07-22","ids":{"openalex":"https://openalex.org/W4400877505","doi":"https://doi.org/10.1109/tase.2024.3427657"},"language":"en","primary_location":{"id":"doi:10.1109/tase.2024.3427657","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2024.3427657","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102973745","display_name":"Wenqian Xue","orcid":"https://orcid.org/0000-0002-3670-3854"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Wenqian Xue","raw_affiliation_strings":["Electrical and Computer Engineering Department, University of Florida, Gainesville, FL, USA"],"affiliations":[{"raw_affiliation_string":"Electrical and Computer Engineering Department, University of Florida, Gainesville, FL, USA","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001862814","display_name":"Bosen Lian","orcid":"https://orcid.org/0000-0002-3275-9551"},"institutions":[{"id":"https://openalex.org/I82497590","display_name":"Auburn University","ror":"https://ror.org/02v80fc35","country_code":"US","type":"education","lineage":["https://openalex.org/I82497590"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bosen Lian","raw_affiliation_strings":["Electrical and Computer Engineering Department, Auburn University, Auburn, AL, USA"],"affiliations":[{"raw_affiliation_string":"Electrical and Computer Engineering Department, Auburn University, Auburn, AL, USA","institution_ids":["https://openalex.org/I82497590"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020552889","display_name":"Yusuf Kartal","orcid":"https://orcid.org/0000-0002-0295-8584"},"institutions":[{"id":"https://openalex.org/I4210147190","display_name":"Turkish Aerospace Industries (Turkey)","ror":"https://ror.org/03jjbp459","country_code":"TR","type":"company","lineage":["https://openalex.org/I4210147190"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Yusuf Kartal","raw_affiliation_strings":["Turkish Aerospace, Kahramankazan/Ankara, T&#x00FC;rkiye"],"affiliations":[{"raw_affiliation_string":"Turkish Aerospace, Kahramankazan/Ankara, T&#x00FC;rkiye","institution_ids":["https://openalex.org/I4210147190"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033960992","display_name":"Jialu Fan","orcid":"https://orcid.org/0000-0001-7585-1166"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jialu Fan","raw_affiliation_strings":["State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042520521","display_name":"Tianyou Chai","orcid":"https://orcid.org/0000-0002-4623-1483"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianyou Chai","raw_affiliation_strings":["State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016137188","display_name":"Frank L. Lewis","orcid":"https://orcid.org/0000-0003-4074-1615"},"institutions":[{"id":"https://openalex.org/I189196454","display_name":"The University of Texas at Arlington","ror":"https://ror.org/019kgqr73","country_code":"US","type":"education","lineage":["https://openalex.org/I189196454"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Frank L. Lewis","raw_affiliation_strings":["The University of Texas at Arlington Research Institute, Fort Worth, TX, USA","The University of Texas, Arlington Research Institute, Fort Worth, TX, USA"],"affiliations":[{"raw_affiliation_string":"The University of Texas at Arlington Research Institute, Fort Worth, TX, USA","institution_ids":["https://openalex.org/I189196454"]},{"raw_affiliation_string":"The University of Texas, Arlington Research Institute, Fort Worth, TX, USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5102973745"],"corresponding_institution_ids":["https://openalex.org/I33213144"],"apc_list":null,"apc_paid":null,"fwci":6.1337,"has_fulltext":false,"cited_by_count":19,"citation_normalized_percentile":{"value":0.96963138,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"22","issue":null,"first_page":"5661","last_page":"5672"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11687","display_name":"Teleoperation and Haptic Systems","score":0.9606999754905701,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13644","display_name":"Control Systems in Engineering","score":0.9598000049591064,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/infinity","display_name":"Infinity","score":0.6316999197006226},{"id":"https://openalex.org/keywords/inverse","display_name":"Inverse","score":0.5608381032943726},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.5350353121757507},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4618069529533386},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4400373101234436},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4304538369178772},{"id":"https://openalex.org/keywords/inverse-problem","display_name":"Inverse problem","score":0.4237826466560364},{"id":"https://openalex.org/keywords/inverse-dynamics","display_name":"Inverse dynamics","score":0.41869574785232544},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3943697214126587},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36228325963020325},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3255360424518585},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.2707424759864807},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.19838929176330566},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.19574835896492004},{"id":"https://openalex.org/keywords/classical-mechanics","display_name":"Classical mechanics","score":0.12650352716445923},{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.08847862482070923}],"concepts":[{"id":"https://openalex.org/C7321624","wikidata":"https://www.wikidata.org/wiki/Q205","display_name":"Infinity","level":2,"score":0.6316999197006226},{"id":"https://openalex.org/C207467116","wikidata":"https://www.wikidata.org/wiki/Q4385666","display_name":"Inverse","level":2,"score":0.5608381032943726},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.5350353121757507},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4618069529533386},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4400373101234436},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4304538369178772},{"id":"https://openalex.org/C135252773","wikidata":"https://www.wikidata.org/wiki/Q1567213","display_name":"Inverse problem","level":2,"score":0.4237826466560364},{"id":"https://openalex.org/C187523126","wikidata":"https://www.wikidata.org/wiki/Q17098330","display_name":"Inverse dynamics","level":3,"score":0.41869574785232544},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3943697214126587},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36228325963020325},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3255360424518585},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.2707424759864807},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.19838929176330566},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.19574835896492004},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.12650352716445923},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.08847862482070923},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tase.2024.3427657","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2024.3427657","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/2","score":0.5400000214576721,"display_name":"Zero hunger"}],"awards":[{"id":"https://openalex.org/G3239473734","display_name":null,"funder_award_id":"XLYC2007135","funder_id":"https://openalex.org/F4320329895","funder_display_name":"Liaoning Revitalization Talents Program"},{"id":"https://openalex.org/G3316198426","display_name":null,"funder_award_id":"62394342","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3712584777","display_name":null,"funder_award_id":"U22A2049","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5620550699","display_name":null,"funder_award_id":"2023JH26/10200011","funder_id":"https://openalex.org/F4320336742","funder_display_name":"Key Research and Development Program of Liaoning Province"},{"id":"https://openalex.org/G5898287775","display_name":null,"funder_award_id":"61991404","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8752119356","display_name":null,"funder_award_id":"XLYC2007135","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320329895","display_name":"Liaoning Revitalization Talents Program","ror":null},{"id":"https://openalex.org/F4320336742","display_name":"Key Research and Development Program of Liaoning Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W1614417283","https://openalex.org/W1970916399","https://openalex.org/W1986864433","https://openalex.org/W1999874108","https://openalex.org/W2027161089","https://openalex.org/W2037997802","https://openalex.org/W2139416664","https://openalex.org/W2146824685","https://openalex.org/W2148439597","https://openalex.org/W2165726932","https://openalex.org/W2484646121","https://openalex.org/W2498694880","https://openalex.org/W2592261783","https://openalex.org/W2734548765","https://openalex.org/W2762709466","https://openalex.org/W2965243272","https://openalex.org/W2975359243","https://openalex.org/W2978237050","https://openalex.org/W3009702296","https://openalex.org/W3019384758","https://openalex.org/W3037298378","https://openalex.org/W3091079486","https://openalex.org/W3156476459","https://openalex.org/W3170519291","https://openalex.org/W3173566350","https://openalex.org/W3195322794","https://openalex.org/W4205497653","https://openalex.org/W4214584936","https://openalex.org/W4221041364","https://openalex.org/W4282588105","https://openalex.org/W4293194127","https://openalex.org/W4295832240","https://openalex.org/W4301018745","https://openalex.org/W4306910464","https://openalex.org/W4310291816","https://openalex.org/W4381162568","https://openalex.org/W4385833430","https://openalex.org/W4387546286","https://openalex.org/W4388319978","https://openalex.org/W4388579564","https://openalex.org/W6638440308","https://openalex.org/W6640443443","https://openalex.org/W6677631742"],"related_works":["https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2778153218","https://openalex.org/W1531601525","https://openalex.org/W2218699221","https://openalex.org/W2331917905","https://openalex.org/W4285133152","https://openalex.org/W3155039083"],"abstract_inverted_index":{"This":[0,280],"paper":[1,281],"proposes":[2],"a":[3,33,75,95,113,194,212,310,322],"data-driven":[4,330],"model-free":[5,114,257,283],"inverse":[6,15,102,262,284],"reinforcement":[7],"learning":[8],"(IRL)":[9],"algorithm":[10,81,118,165,320],"tailored":[11],"for":[12,123,183,215,274,294],"solving":[13],"an":[14,30,249,277,316,338],"<inline-formula":[16,37,239,265,285],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[17,38,240,266,286],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[18,39,241,267,287],"<tex-math":[19,40,242,268,288],"notation=\"LaTeX\">$H_{\\infty":[20,41,243,269,289],"}":[21,42,244,270,290],"$":[22,43,245,271,291],"</tex-math></inline-formula>":[23,44,246,272,292],"control":[24,45,104,188,247,273,293,341],"problem.":[25],"In":[26,207],"the":[27,50,56,61,88,100,108,121,131,150,155,161,175,180,261,300,304,334],"problem,":[28],"both":[29],"expert":[31,134,296],"and":[32,49,91,99,127,135,145,152,168,197,204,233,331,352],"learner":[34],"engage":[35],"in":[36,200,224],"to":[46,54,148,174,178,230,252,259,325,336],"reject":[47],"disturbances":[48,232],"learner\u2019s":[51],"objective":[52],"is":[53,189,193,211,248,329,344],"imitate":[55],"expert\u2019s":[57,62],"behavior":[58],"by":[59],"reconstructing":[60,216],"performance":[63,92],"function":[64,93,182],"through":[65,166],"IRL":[66,78,117,210,258,306,319],"techniques.":[67],"Introducing":[68],"zero-sum":[69],"game":[70],"principles,":[71],"we":[72,111,138,159],"first":[73],"formulate":[74],"model-based":[76,109],"single-loop":[77,115,318],"policy":[79],"iteration":[80,312],"that":[82,119,308],"includes":[83],"three":[84],"key":[85],"steps:":[86],"updating":[87],"policy,":[89,342],"action,":[90],"using":[94],"new":[96,323],"correction":[97],"formula":[98],"standard":[101],"optimal":[103,184],"principles.":[105],"Building":[106],"upon":[107],"approach,":[110],"propose":[112,315],"off-policy":[116],"eliminates":[120],"need":[122,335],"initial":[124,339],"stabilizing":[125,340],"policies":[126],"prior":[128],"knowledge":[129],"of":[130,133,142,154,163,264,303],"dynamics":[132],"learner.":[136],"Also,":[137],"provide":[139],"rigorous":[140],"proof":[141],"convergence,":[143,350],"stability,":[144,351],"Nash":[146],"optimality":[147,353],"guarantee":[149],"effectiveness":[151],"reliability":[153],"proposed":[156],"algorithms.":[157],"Furthermore,":[158],"showcase":[160],"efficiency":[162],"our":[164],"simulations":[167],"experiments,":[169],"highlighting":[170],"its":[171],"advantages":[172],"compared":[173],"existing":[176,305],"methods.Note":[177],"Practitioners\u2014Generally,":[179],"cost":[181,218],"tracking":[185,202],"or":[186],"imitation":[187,275],"manually":[190],"defined,":[191],"which":[192,343],"challenging":[195],"task":[196],"may":[198],"result":[199],"large":[201],"errors":[203],"slow":[205],"tracking.":[206],"such":[208],"cases,":[209,226],"powerful":[213],"tool":[214],"proper":[217],"functions.":[219],"Real-world":[220],"systems,":[221],"as":[222],"demonstrated":[223],"practical":[225],"are":[227],"frequently":[228],"exposed":[229],"external":[231],"come":[234],"with":[235,321,354],"unknown":[236],"models.":[237],"Employing":[238],"effective":[250],"strategy":[251],"handle":[253],"disturbances.":[254],"However,":[255],"applying":[256],"solve":[260],"problem":[263],"remains":[276],"underexplored":[278],"domain.":[279],"explores":[282],"imitating":[295],"behaviors,":[297],"specifically":[298],"addressing":[299],"time-consuming":[301],"nature":[302],"studies":[307],"employ":[309],"two-loop":[311],"structure.":[313],"We":[314],"efficient":[317],"framework":[324],"do":[326],"this.":[327],"It":[328],"model-free,":[332],"eliminating":[333],"find":[337],"typically":[345],"challenging.":[346],"Additionally,":[347],"it":[348],"ensures":[349],"provable":[355],"guarantees.":[356]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":17}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
