{"id":"https://openalex.org/W4399665804","doi":"https://doi.org/10.1109/tase.2024.3412188","title":"Optimal Robust Formation of Multi-Agent Systems as Adversarial Graphical Apprentice Games With Inverse Reinforcement Learning","display_name":"Optimal Robust Formation of Multi-Agent Systems as Adversarial Graphical Apprentice Games With Inverse Reinforcement Learning","publication_year":2024,"publication_date":"2024-06-14","ids":{"openalex":"https://openalex.org/W4399665804","doi":"https://doi.org/10.1109/tase.2024.3412188"},"language":"en","primary_location":{"id":"doi:10.1109/tase.2024.3412188","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2024.3412188","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092254495","display_name":"Fatemeh Mahdavi Golmisheh","orcid":"https://orcid.org/0000-0002-2034-8130"},"institutions":[{"id":"https://openalex.org/I67009956","display_name":"Iran University of Science and Technology","ror":"https://ror.org/01jw2p796","country_code":"IR","type":"education","lineage":["https://openalex.org/I67009956"]}],"countries":["IR"],"is_corresponding":true,"raw_author_name":"Fatemeh Mahdavi Golmisheh","raw_affiliation_strings":["Electrical Engineering Department, Iran University of Science and Technology (IUST), Tehran, Iran"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering Department, Iran University of Science and Technology (IUST), Tehran, Iran","institution_ids":["https://openalex.org/I67009956"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065722336","display_name":"Saeed Shamaghdari","orcid":"https://orcid.org/0000-0002-2014-3098"},"institutions":[{"id":"https://openalex.org/I67009956","display_name":"Iran University of Science and Technology","ror":"https://ror.org/01jw2p796","country_code":"IR","type":"education","lineage":["https://openalex.org/I67009956"]}],"countries":["IR"],"is_corresponding":false,"raw_author_name":"Saeed Shamaghdari","raw_affiliation_strings":["Electrical Engineering Department, Iran University of Science and Technology (IUST), Tehran, Iran"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering Department, Iran University of Science and Technology (IUST), Tehran, Iran","institution_ids":["https://openalex.org/I67009956"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5092254495"],"corresponding_institution_ids":["https://openalex.org/I67009956"],"apc_list":null,"apc_paid":null,"fwci":9.8297,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.97860502,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"22","issue":null,"first_page":"4867","last_page":"4880"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12158","display_name":"Guidance and Control Systems","score":0.6923999786376953,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12158","display_name":"Guidance and Control Systems","score":0.6923999786376953,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14420","display_name":"Advanced Research in Systems and Signal Processing","score":0.6873000264167786,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10482","display_name":"Mathematical and Theoretical Epidemiology and Ecology Models","score":0.6690000295639038,"subfield":{"id":"https://openalex.org/subfields/2739","display_name":"Public Health, Environmental and Occupational Health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.7879291772842407},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6429219245910645},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5637708306312561},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.5124176144599915},{"id":"https://openalex.org/keywords/inverse","display_name":"Inverse","score":0.5043107271194458},{"id":"https://openalex.org/keywords/apprenticeship","display_name":"Apprenticeship","score":0.4491727352142334},{"id":"https://openalex.org/keywords/inverse-problem","display_name":"Inverse problem","score":0.44259369373321533},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4412643313407898},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4236312806606293},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.37822359800338745},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.2647309899330139},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.19345906376838684}],"concepts":[{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.7879291772842407},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6429219245910645},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5637708306312561},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.5124176144599915},{"id":"https://openalex.org/C207467116","wikidata":"https://www.wikidata.org/wiki/Q4385666","display_name":"Inverse","level":2,"score":0.5043107271194458},{"id":"https://openalex.org/C107806365","wikidata":"https://www.wikidata.org/wiki/Q253567","display_name":"Apprenticeship","level":2,"score":0.4491727352142334},{"id":"https://openalex.org/C135252773","wikidata":"https://www.wikidata.org/wiki/Q1567213","display_name":"Inverse problem","level":2,"score":0.44259369373321533},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4412643313407898},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4236312806606293},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.37822359800338745},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2647309899330139},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.19345906376838684},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tase.2024.3412188","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2024.3412188","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W102873864","https://openalex.org/W1614417283","https://openalex.org/W1970148674","https://openalex.org/W1999874108","https://openalex.org/W2027161089","https://openalex.org/W2073668543","https://openalex.org/W2086602679","https://openalex.org/W2092215165","https://openalex.org/W2107396783","https://openalex.org/W2165726932","https://openalex.org/W2347074400","https://openalex.org/W2575417362","https://openalex.org/W2794108217","https://openalex.org/W2811409798","https://openalex.org/W2886235386","https://openalex.org/W2928707119","https://openalex.org/W2943094749","https://openalex.org/W3007973969","https://openalex.org/W3009702296","https://openalex.org/W3037298378","https://openalex.org/W3085531353","https://openalex.org/W3088521775","https://openalex.org/W3122575011","https://openalex.org/W3156476459","https://openalex.org/W3170519291","https://openalex.org/W3186624155","https://openalex.org/W3195322794","https://openalex.org/W3203504876","https://openalex.org/W3205613070","https://openalex.org/W3205647333","https://openalex.org/W4213070435","https://openalex.org/W4287845925","https://openalex.org/W4307234290","https://openalex.org/W4381162568","https://openalex.org/W4381893597","https://openalex.org/W4386276869","https://openalex.org/W6633543754","https://openalex.org/W6634004297","https://openalex.org/W6638440308","https://openalex.org/W6809541652"],"related_works":["https://openalex.org/W2130264791","https://openalex.org/W2502115930","https://openalex.org/W4235622043","https://openalex.org/W2155887593","https://openalex.org/W2102428166","https://openalex.org/W1600547024","https://openalex.org/W3125491562","https://openalex.org/W2239395319","https://openalex.org/W2573907782","https://openalex.org/W2980420562"],"abstract_inverted_index":{"This":[0,43,71,249,262],"paper":[1],"introduces":[2],"a":[3,77,198,291,300],"novel":[4],"approach":[5,21,296],"to":[6,54,206,221,244,258,279],"solving":[7],"robust":[8],"optimal":[9,89,98,129,168,209,223,266,322],"formation":[10,323],"control":[11,90,99,130,169],"problems":[12,324],"in":[13,93,104,126,213,325],"heterogeneous":[14],"multi-agent":[15],"systems":[16],"(MASs)":[17],"with":[18,81,255,284,313],"disturbances.":[19],"Our":[20],"frames":[22],"this":[23,260,316],"problem":[24],"as":[25,68,271,290],"an":[26,37,138,208],"adversarial":[27],"graphical":[28],"apprentice":[29],"game":[30,34],"problem,":[31],"using":[32,109],"the":[33,46,56,88,94,97,105,112,115,119,127,191,194,222,235,239,246,256,265,275,281,285,310],"concept":[35],"and":[36,65,121,152,170,178,180,238,321],"inverse":[38,128],"reinforcement":[39],"learning":[40],"(IRL)":[41],"algorithm.":[42],"work":[44],"innovates":[45],"derivation":[47],"of":[48,84,91,100,118,148,193,200,303],"unknown":[49],"reward":[50,116,155,184,241],"functions":[51,117,156],"through":[52],"demonstrations":[53],"achieve":[55,245],"desired":[57,247,282],"formation.":[58],"In":[59,111],"addition,":[60],"we":[61,136,217,231,277,307],"define":[62],"learner,":[63],"estimator,":[64],"expert":[66,272],"MASs":[67,123],"separate":[69],"entities.":[70],"aim":[72],"is":[73,102,211,228,288,297],"achieved":[74],"by":[75,108],"introducing":[76],"model-based":[78],"IRL":[79,142,165,253],"algorithm":[80,139],"three":[82],"stages":[83],"learning.":[85],"After":[86],"determining":[87],"estimators":[92],"first":[95],"stage,":[96,114],"learners":[101],"found":[103],"second":[106],"stage":[107,132],"them.":[110],"third":[113],"estimator":[120],"learner":[122,149,292,311],"are":[124,186],"updated":[125],"(IOC)":[131],"simultaneously.":[133],"Following":[134],"that,":[135],"present":[137],"for":[140,176,197,269,299],"model-free":[141],"that":[143,182],"does":[144],"not":[145,233],"require":[146],"knowledge":[147],"agents\u2019":[150,236],"dynamics":[151,237],"can":[153],"reconstruct":[154],"after":[157],"observing":[158],"online":[159],"trajectories.":[160],"As":[161],"subproblems,":[162],"both":[163],"proposed":[164,295],"algorithms":[166,196,254],"address":[167],"IOC.":[171],"We":[172],"analyze":[173],"these":[174],"approaches":[175],"stability":[177],"convergence":[179],"demonstrate":[181],"state":[183],"weights":[185],"non-unique.":[187],"Simulation":[188],"results":[189],"show":[190],"effectiveness":[192],"introduced":[195],"group":[199],"unmanned":[201],"aerial":[202],"vehicles":[203],"(UAVs).":[204],"Note":[205],"Practitioners\u2014Designing":[207],"controller":[210],"challenging":[212],"MAS,":[214,276],"especially":[215],"where":[216],"only":[218],"have":[219,308],"access":[220],"reference":[224,267],"path.":[225,248],"The":[226,294],"challenge":[227],"compounded":[229],"if":[230],"do":[232],"know":[234],"appropriate":[240],"function":[242],"needed":[243],"article":[250],"proposes":[251],"two":[252],"motivation":[257],"solve":[259],"problem.":[261],"study":[263],"considers":[264],"path":[268,283],"agents":[270],"MAS.":[273,293],"Also,":[274],"want":[278],"follow":[280],"minor":[286],"error,":[287],"represented":[289],"suitable":[298],"large":[301],"class":[302],"linear":[304],"MAS":[305,312],"since":[306],"modeled":[309],"disturbance.":[314],"Therefore,":[315],"method":[317],"suits":[318],"tracking,":[319],"path-planning,":[320],"MASs.":[326],"It":[327],"requires":[328],"minimal":[329],"information":[330],"but":[331],"yields":[332],"impressive":[333],"results.":[334]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":12}],"updated_date":"2025-12-22T23:10:17.713674","created_date":"2025-10-10T00:00:00"}
