{"id":"https://openalex.org/W4296474687","doi":"https://doi.org/10.1109/cog51982.2022.9893722","title":"VMAPD: Generate Diverse Solutions for Multi-Agent Games with Recurrent Trajectory Discriminators","display_name":"VMAPD: Generate Diverse Solutions for Multi-Agent Games with Recurrent Trajectory Discriminators","publication_year":2022,"publication_date":"2022-08-21","ids":{"openalex":"https://openalex.org/W4296474687","doi":"https://doi.org/10.1109/cog51982.2022.9893722"},"language":"en","primary_location":{"id":"doi:10.1109/cog51982.2022.9893722","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cog51982.2022.9893722","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE Conference on Games (CoG)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101984824","display_name":"Shiyu Huang","orcid":"https://orcid.org/0000-0003-0500-0141"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shiyu Huang","raw_affiliation_strings":["Tsinghua University,Beijing,China","Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Beijing,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054149338","display_name":"Chao Yu","orcid":"https://orcid.org/0000-0002-4279-2152"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Yu","raw_affiliation_strings":["Tsinghua University,Beijing,China","Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Beijing,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108156794","display_name":"Bin Wang","orcid":"https://orcid.org/0000-0002-3790-2708"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Wang","raw_affiliation_strings":["Huawei Noah&#x2019;s Ark Lab,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Huawei Noah&#x2019;s Ark Lab,Beijing,China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100407362","display_name":"Dong Li","orcid":null},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dong Li","raw_affiliation_strings":["Huawei Noah&#x2019;s Ark Lab,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Huawei Noah&#x2019;s Ark Lab,Beijing,China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100445144","display_name":"Yu Wang","orcid":"https://orcid.org/0000-0002-0431-1039"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu Wang","raw_affiliation_strings":["Tsinghua University,Beijing,China","Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Beijing,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100443189","display_name":"Ting Chen","orcid":"https://orcid.org/0000-0002-3228-9166"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ting Chen","raw_affiliation_strings":["Tsinghua University,Beijing,China","Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Beijing,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100606995","display_name":"Jun Zhu","orcid":"https://orcid.org/0000-0002-6254-2388"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Zhu","raw_affiliation_strings":["Tsinghua University,Beijing,China","Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Beijing,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101984824"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.1326,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.52970061,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"575","issue":null,"first_page":"9","last_page":"16"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9789000153541565,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9761999845504761,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.813998818397522},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6665239334106445},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.42778605222702026},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34940093755722046},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.07584121823310852}],"concepts":[{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.813998818397522},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6665239334106445},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.42778605222702026},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34940093755722046},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.07584121823310852},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cog51982.2022.9893722","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cog51982.2022.9893722","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE Conference on Games (CoG)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.7400000095367432}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322392","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":64,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1941248864","https://openalex.org/W2026723619","https://openalex.org/W2068674173","https://openalex.org/W2098774185","https://openalex.org/W2157331557","https://openalex.org/W2747213132","https://openalex.org/W2753738274","https://openalex.org/W2785315072","https://openalex.org/W2785342287","https://openalex.org/W2798391154","https://openalex.org/W2799151646","https://openalex.org/W2904246096","https://openalex.org/W2950397026","https://openalex.org/W2962730405","https://openalex.org/W2962854145","https://openalex.org/W2963438456","https://openalex.org/W2963523627","https://openalex.org/W2963722050","https://openalex.org/W2982316857","https://openalex.org/W2995107092","https://openalex.org/W2995650662","https://openalex.org/W2996037775","https://openalex.org/W3002670059","https://openalex.org/W3034008431","https://openalex.org/W3089778445","https://openalex.org/W3091287254","https://openalex.org/W3098272089","https://openalex.org/W3122690883","https://openalex.org/W3134226813","https://openalex.org/W3137337287","https://openalex.org/W3159637833","https://openalex.org/W4288091739","https://openalex.org/W4288294128","https://openalex.org/W4288594419","https://openalex.org/W4295598622","https://openalex.org/W4299802797","https://openalex.org/W6631190155","https://openalex.org/W6640661648","https://openalex.org/W6674884181","https://openalex.org/W6685757253","https://openalex.org/W6738796088","https://openalex.org/W6747941106","https://openalex.org/W6748566876","https://openalex.org/W6748603076","https://openalex.org/W6749304979","https://openalex.org/W6749821205","https://openalex.org/W6750186571","https://openalex.org/W6751659697","https://openalex.org/W6757592117","https://openalex.org/W6758507868","https://openalex.org/W6758846586","https://openalex.org/W6765407481","https://openalex.org/W6767327128","https://openalex.org/W6771398375","https://openalex.org/W6772005887","https://openalex.org/W6772027365","https://openalex.org/W6779621802","https://openalex.org/W6783196708","https://openalex.org/W6783704099","https://openalex.org/W6783988234","https://openalex.org/W6791474689","https://openalex.org/W6791533262","https://openalex.org/W6791779665"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4323768008","https://openalex.org/W1941703695","https://openalex.org/W4248382324"],"abstract_inverted_index":{"Recent":[0],"algorithms":[1,37],"designed":[2],"for":[3,13,72,76],"multi-agent":[4,65,96,162],"tasks":[5,20],"focus":[6],"on":[7,107,159],"finding":[8],"a":[9,101,131],"single":[10],"optimal":[11,33],"solution":[12],"all":[14,111],"the":[15,90,108,120,138,146,154],"agents.":[16,81,112],"However,":[17],"in":[18],"many":[19,46],"(e.g.,":[21],"matrix":[22],"games":[23],"and":[24,88,95,124],"transportation":[25],"dispatching),":[26],"there":[27],"may":[28],"exist":[29],"more":[30,170],"than":[31],"one":[32,42],"solution,":[34],"while":[35],"previous":[36],"can":[38,125],"only":[39],"converge":[40],"to":[41,52,118,144],"of":[43,79,85,110,156],"them.":[44],"In":[45,59],"practical":[47],"applications,":[48],"it":[49],"is":[50],"important":[51],"develop":[53],"reasonable":[54],"agents":[55,140],"with":[56,172,177],"diverse":[57,74],"behaviors.":[58],"this":[60],"paper,":[61],"we":[62,99],"propose":[63],"\u201dvariational":[64],"policy":[66,116],"diversification\u201d":[67],"(VMAPD),":[68],"an":[69],"on-policy":[70],"framework":[71],"discovering":[73],"policies":[75],"coordination":[77],"patterns":[78],"multiple":[80],"By":[82],"taking":[83],"advantage":[84],"latent":[86],"variables":[87],"exploiting":[89],"connection":[91],"between":[92],"variational":[93],"inference":[94],"reinforcement":[97],"learning,":[98],"derive":[100],"tractable":[102],"evidence":[103],"lower":[104,122],"bound":[105,123],"(ELBO)":[106],"trajectories":[109],"Our":[113],"algorithm":[114,158],"uses":[115],"iteration":[117],"maximize":[119],"derived":[121],"be":[126],"simply":[127],"implemented":[128],"by":[129],"adding":[130],"pseudo":[132,147],"reward":[133,148],"during":[134,149],"centralized":[135],"learning.":[136],"And":[137],"trained":[139],"do":[141],"not":[142],"need":[143],"access":[145],"decentralized":[150],"execution.":[151],"We":[152],"demonstrate":[153],"effectiveness":[155],"our":[157],"several":[160],"popular":[161],"testbeds.":[163],"Experimental":[164],"results":[165],"show":[166],"that":[167],"VMAPD":[168],"finds":[169],"solutions":[171],"similar":[173],"sample":[174],"complexity":[175],"compared":[176],"other":[178],"baselines.":[179]},"counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
