{"id":"https://openalex.org/W3202277149","doi":"https://doi.org/10.1109/tro.2022.3232300","title":"Maximum-Entropy Multi-Agent Dynamic Games: Forward and Inverse Solutions","display_name":"Maximum-Entropy Multi-Agent Dynamic Games: Forward and Inverse Solutions","publication_year":2023,"publication_date":"2023-01-19","ids":{"openalex":"https://openalex.org/W3202277149","doi":"https://doi.org/10.1109/tro.2022.3232300","mag":"3202277149"},"language":"en","primary_location":{"id":"doi:10.1109/tro.2022.3232300","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tro.2022.3232300","pdf_url":"https://ieeexplore.ieee.org/ielx7/8860/4359257/10021943.pdf","source":{"id":"https://openalex.org/S144620930","display_name":"IEEE Transactions on Robotics","issn_l":"1552-3098","issn":["1552-3098","1941-0468"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://ieeexplore.ieee.org/ielx7/8860/4359257/10021943.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062267932","display_name":"Negar Mehr","orcid":"https://orcid.org/0000-0002-1045-4423"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Negar Mehr","raw_affiliation_strings":["Aerospace Engineering Department, University of Illinois Urbana-Champaign, Urbana, IL, USA"],"affiliations":[{"raw_affiliation_string":"Aerospace Engineering Department, University of Illinois Urbana-Champaign, Urbana, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100350104","display_name":"Mingyu Wang","orcid":"https://orcid.org/0000-0002-0063-7445"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mingyu Wang","raw_affiliation_strings":["Department of Mechanical Engineering, Stanford University, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081923391","display_name":"Maulik Bhatt","orcid":"https://orcid.org/0000-0002-4742-9192"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Maulik Bhatt","raw_affiliation_strings":["Department of Aerospace Engineering, University of Illinois Urbana-Champaign, Urbana, IL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Aerospace Engineering, University of Illinois Urbana-Champaign, Urbana, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081950488","display_name":"Mac Schwager","orcid":"https://orcid.org/0000-0002-7871-3663"},"institutions":[{"id":"https://openalex.org/I13805885","display_name":"Vaughn College of Aeronautics and Technology","ror":"https://ror.org/056e22e24","country_code":"US","type":"education","lineage":["https://openalex.org/I13805885"]},{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mac Schwager","raw_affiliation_strings":["Department of Aeronautics and Astronautics, Stanford University, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Aeronautics and Astronautics, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I13805885","https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5062267932"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":7.7773,"has_fulltext":true,"cited_by_count":45,"citation_normalized_percentile":{"value":0.97982165,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"39","issue":"3","first_page":"1801","last_page":"1815"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9847000241279602,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10646","display_name":"Experimental Behavioral Economics Studies","score":0.9645000100135803,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5849900245666504},{"id":"https://openalex.org/keywords/rational-agent","display_name":"Rational agent","score":0.5516074299812317},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5447528958320618},{"id":"https://openalex.org/keywords/nash-equilibrium","display_name":"Nash equilibrium","score":0.515559196472168},{"id":"https://openalex.org/keywords/sequential-game","display_name":"Sequential game","score":0.4372013211250305},{"id":"https://openalex.org/keywords/game-theory","display_name":"Game theory","score":0.36568406224250793},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3202596604824066},{"id":"https://openalex.org/keywords/mathematical-economics","display_name":"Mathematical economics","score":0.27745139598846436},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.11502155661582947}],"concepts":[{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5849900245666504},{"id":"https://openalex.org/C31772880","wikidata":"https://www.wikidata.org/wiki/Q2666479","display_name":"Rational agent","level":2,"score":0.5516074299812317},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5447528958320618},{"id":"https://openalex.org/C46814582","wikidata":"https://www.wikidata.org/wiki/Q23389","display_name":"Nash equilibrium","level":2,"score":0.515559196472168},{"id":"https://openalex.org/C73795354","wikidata":"https://www.wikidata.org/wiki/Q287618","display_name":"Sequential game","level":3,"score":0.4372013211250305},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.36568406224250793},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3202596604824066},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.27745139598846436},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.11502155661582947}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tro.2022.3232300","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tro.2022.3232300","pdf_url":"https://ieeexplore.ieee.org/ielx7/8860/4359257/10021943.pdf","source":{"id":"https://openalex.org/S144620930","display_name":"IEEE Transactions on Robotics","issn_l":"1552-3098","issn":["1552-3098","1941-0468"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Robotics","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1109/tro.2022.3232300","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tro.2022.3232300","pdf_url":"https://ieeexplore.ieee.org/ielx7/8860/4359257/10021943.pdf","source":{"id":"https://openalex.org/S144620930","display_name":"IEEE Transactions on Robotics","issn_l":"1552-3098","issn":["1552-3098","1941-0468"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Robotics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G223589181","display_name":null,"funder_award_id":"N00014-18-1-2830","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G2428326068","display_name":null,"funder_award_id":"ECCS-2145134","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G2637195115","display_name":null,"funder_award_id":"4-18-1-","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G2811237814","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G2976417562","display_name":null,"funder_award_id":"CCF-2211542","funder_id":"https://openalex.org/F4320335353","funder_display_name":"National Science Foundation of Sri Lanka"},{"id":"https://openalex.org/G3296431679","display_name":null,"funder_award_id":"N00014-18-1-2830,","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G4510926165","display_name":"Collaborative Research: CPS: Small: Risk-Aware Planning and Control for Safety-Critical Human-CPS","funder_award_id":"2218759","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5042274488","display_name":null,"funder_award_id":"CNS-2218759","funder_id":"https://openalex.org/F4320335353","funder_display_name":"National Science Foundation of Sri Lanka"},{"id":"https://openalex.org/G5130693409","display_name":null,"funder_award_id":"2145134","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7014191820","display_name":"Collaborative Research: Interaction-aware Planning and Control for Robotic Navigation in the Crowd","funder_award_id":"2211542","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7631143731","display_name":null,"funder_award_id":"N00014-18-1-2830","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8470815717","display_name":null,"funder_award_id":"ECCS-2145134 CAREER Award","funder_id":"https://openalex.org/F4320335353","funder_display_name":"National Science Foundation of Sri Lanka"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8876996369","display_name":null,"funder_award_id":"N00014","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320315934","display_name":"Toyota Research Institute","ror":null},{"id":"https://openalex.org/F4320335353","display_name":"National Science Foundation of Sri Lanka","ror":"https://ror.org/010xaa060"},{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"},{"id":"https://openalex.org/F4320337392","display_name":"Division of Electrical, Communications and Cyber Systems","ror":"https://ror.org/01krpsy48"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3202277149.pdf","grobid_xml":"https://content.openalex.org/works/W3202277149.grobid-xml"},"referenced_works_count":84,"referenced_works":["https://openalex.org/W64088143","https://openalex.org/W195033972","https://openalex.org/W1578630563","https://openalex.org/W1595575180","https://openalex.org/W1801976851","https://openalex.org/W1964946446","https://openalex.org/W1965455100","https://openalex.org/W1970916399","https://openalex.org/W1974964983","https://openalex.org/W1999874108","https://openalex.org/W2002373723","https://openalex.org/W2019901401","https://openalex.org/W2037997802","https://openalex.org/W2046210054","https://openalex.org/W2061562262","https://openalex.org/W2098774185","https://openalex.org/W2099111195","https://openalex.org/W2104733512","https://openalex.org/W2117885752","https://openalex.org/W2124394479","https://openalex.org/W2147032798","https://openalex.org/W2148962857","https://openalex.org/W2164429173","https://openalex.org/W2209480589","https://openalex.org/W2210387432","https://openalex.org/W2221312193","https://openalex.org/W2264897026","https://openalex.org/W2290104316","https://openalex.org/W2410842990","https://openalex.org/W2411577903","https://openalex.org/W2594103415","https://openalex.org/W2609650878","https://openalex.org/W2727450595","https://openalex.org/W2737702598","https://openalex.org/W2765116338","https://openalex.org/W2765199760","https://openalex.org/W2799151646","https://openalex.org/W2811409798","https://openalex.org/W2883057932","https://openalex.org/W2946233467","https://openalex.org/W2949561945","https://openalex.org/W2963277051","https://openalex.org/W2963289505","https://openalex.org/W2963368198","https://openalex.org/W2963390138","https://openalex.org/W2963584844","https://openalex.org/W2963590100","https://openalex.org/W2964367126","https://openalex.org/W2980087597","https://openalex.org/W2980903217","https://openalex.org/W2990116160","https://openalex.org/W2996499288","https://openalex.org/W3010842970","https://openalex.org/W3035478219","https://openalex.org/W3045019238","https://openalex.org/W3045870112","https://openalex.org/W3046169940","https://openalex.org/W3089576059","https://openalex.org/W3130217624","https://openalex.org/W3153199159","https://openalex.org/W3159797474","https://openalex.org/W3174761862","https://openalex.org/W4294187414","https://openalex.org/W6607786297","https://openalex.org/W6635451124","https://openalex.org/W6638440308","https://openalex.org/W6674884181","https://openalex.org/W6675999342","https://openalex.org/W6679945570","https://openalex.org/W6681631837","https://openalex.org/W6688456363","https://openalex.org/W6688828641","https://openalex.org/W6696380822","https://openalex.org/W6718092244","https://openalex.org/W6734517396","https://openalex.org/W6736495777","https://openalex.org/W6750186571","https://openalex.org/W6753207554","https://openalex.org/W6763248972","https://openalex.org/W6768870957","https://openalex.org/W6773024798","https://openalex.org/W6773097889","https://openalex.org/W6781737445","https://openalex.org/W6903351479"],"related_works":["https://openalex.org/W2605224496","https://openalex.org/W4312141693","https://openalex.org/W3123463717","https://openalex.org/W123624058","https://openalex.org/W2803144261","https://openalex.org/W1586896826","https://openalex.org/W2069037520","https://openalex.org/W2118082251","https://openalex.org/W2406869706","https://openalex.org/W2162110047"],"abstract_inverted_index":{"In":[0,171],"this":[1],"article,":[2],"we":[3,37,80,120,174],"study":[4],"the":[5,39,66,72,77,92,98,113,117,126,130,167,181],"problem":[6],"of":[7,28,55,129,151,193],"multiple":[8,53,131],"stochastic":[9,29],"agents":[10,54,133,144],"interacting":[11,132],"in":[12,97,146,156],"a":[13,25,49,60,82,157,189],"dynamic":[14],"game":[15,183],"scenario":[16],"with":[17,164,200],"continuous":[18],"state":[19,140],"and":[20,68,139,163],"action":[21],"spaces.":[22],"We":[23,44,63,101],"define":[24],"new":[26],"notion":[27],"Nash":[30],"equilibrium":[31,42],"for":[32,59,71,91,112],"boundedly":[33,136],"rational":[34,137],"agents,":[35,93],"which":[36,94],"call":[38],"entropic":[40],"cost":[41,127],"(ECE).":[43],"show":[45,175],"that":[46],"ECE":[47,74,88,109],"is":[48,154],"natural":[50],"extension":[51],"to":[52,85,106,124],"maximum":[56],"entropy":[57],"optimality":[58],"single":[61],"agent.":[62],"solve":[64],"both":[65,172],"\u201cforward\u201d":[67],"\u201cinverse\u201d":[69],"problems":[70],"multi-agent":[73,159],"game.":[75],"For":[76,116],"forward":[78],"problem,":[79,119],"provide":[81],"Riccati":[83],"algorithm":[84,123],"compute":[86],"closed-form":[87],"feedback":[89,110],"policies":[90,111],"are":[95],"exact":[96],"linear-quadratic-gaussian":[99],"case.":[100,115],"give":[102],"an":[103,122,147],"iterative":[104],"variant":[105],"find":[107],"locally":[108],"nonlinear":[114],"inverse":[118,202],"present":[121],"infer":[125],"functions":[128],"given":[134],"noisy,":[135],"input":[138],"trajectory":[141],"examples":[142],"from":[143,166],"acting":[145],"ECE.":[148],"The":[149],"effectiveness":[150],"our":[152,187],"algorithms":[153],"demonstrated":[155],"simulated":[158],"collision":[160],"avoidance":[161],"scenario,":[162],"data":[165],"INTERACTION":[168],"traffic":[169],"dataset.":[170],"cases,":[173],"that,":[176],"by":[177],"taking":[178],"into":[179],"account":[180],"agents'":[182,194],"theoretic":[184],"interactions":[185],"using":[186],"algorithm,":[188],"more":[190],"accurate":[191],"model":[192],"costs":[195],"can":[196],"be":[197],"learned,":[198],"compared":[199],"standard":[201],"optimal":[203],"control":[204],"methods.":[205]},"counts_by_year":[{"year":2025,"cited_by_count":21},{"year":2024,"cited_by_count":15},{"year":2023,"cited_by_count":9}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
