{"id":"https://openalex.org/W4312684648","doi":"https://doi.org/10.1109/ijcnn55064.2022.9892225","title":"RACA: Relation-Aware Credit Assignment for Ad-Hoc Cooperation in Multi-Agent Deep Reinforcement Learning","display_name":"RACA: Relation-Aware Credit Assignment for Ad-Hoc Cooperation in Multi-Agent Deep Reinforcement Learning","publication_year":2022,"publication_date":"2022-07-18","ids":{"openalex":"https://openalex.org/W4312684648","doi":"https://doi.org/10.1109/ijcnn55064.2022.9892225"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn55064.2022.9892225","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn55064.2022.9892225","pdf_url":null,"source":{"id":"https://openalex.org/S4363607707","display_name":"2022 International Joint Conference on Neural Networks (IJCNN)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100353673","display_name":"Hao Chen","orcid":"https://orcid.org/0009-0001-6480-7976"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hao Chen","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Artificial Intelligence","School of Artificial Intelligence, University of Chinese Academy of Sciences","CRISE, Institute of Automation, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Artificial Intelligence","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"CRISE, Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041120260","display_name":"Guangkai Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guangkai Yang","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Artificial Intelligence","CRISE, Institute of Automation, Chinese Academy of Sciences","School of Artificial Intelligence, University of Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Artificial Intelligence","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"CRISE, Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109012644","display_name":"Junge Zhang","orcid":"https://orcid.org/0000-0002-9970-394X"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junge Zhang","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Artificial Intelligence","CRISE, Institute of Automation, Chinese Academy of Sciences","School of Artificial Intelligence, University of Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Artificial Intelligence","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"CRISE, Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083652259","display_name":"Qiyue Yin","orcid":"https://orcid.org/0000-0002-3442-6275"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiyue Yin","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Artificial Intelligence","CRISE, Institute of Automation, Chinese Academy of Sciences","School of Artificial Intelligence, University of Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Artificial Intelligence","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"CRISE, Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028693655","display_name":"Kaiqi Huang","orcid":"https://orcid.org/0000-0002-2677-9273"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210097554","display_name":"Center for Excellence in Brain Science and Intelligence Technology","ror":"https://ror.org/00vpwhm04","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210097554"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaiqi Huang","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Artificial Intelligence","School of Artificial Intelligence, University of Chinese Academy of Sciences","CRISE, Institute of Automation, Chinese Academy of Sciences","CAS Center for Excellence in Brain Science and Intelligence Technology, Beijing, P.R.China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Artificial Intelligence","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"CRISE, Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"CAS Center for Excellence in Brain Science and Intelligence Technology, Beijing, P.R.China","institution_ids":["https://openalex.org/I4210097554"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100353673"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.2078,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.43896789,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9624999761581421,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9502000212669373,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8138007521629333},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7162017226219177},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.47817593812942505},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.4732542634010315},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4605405032634735},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4334624111652374},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.412087619304657},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.40148407220840454},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3407632112503052},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.1408196985721588}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8138007521629333},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7162017226219177},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.47817593812942505},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.4732542634010315},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4605405032634735},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4334624111652374},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.412087619304657},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.40148407220840454},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3407632112503052},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.1408196985721588},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn55064.2022.9892225","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn55064.2022.9892225","pdf_url":null,"source":{"id":"https://openalex.org/S4363607707","display_name":"2022 International Joint Conference on Neural Networks (IJCNN)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","display_name":"Partnerships for the goals","score":0.44999998807907104}],"awards":[{"id":"https://openalex.org/G852446924","display_name":null,"funder_award_id":"61876181","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":69,"referenced_works":["https://openalex.org/W26302103","https://openalex.org/W1606056663","https://openalex.org/W1657704689","https://openalex.org/W2026662445","https://openalex.org/W2121092017","https://openalex.org/W2136418668","https://openalex.org/W2139993574","https://openalex.org/W2141088582","https://openalex.org/W2145339207","https://openalex.org/W2146544759","https://openalex.org/W2617547828","https://openalex.org/W2747213132","https://openalex.org/W2751808960","https://openalex.org/W2804057010","https://openalex.org/W2807741983","https://openalex.org/W2903871660","https://openalex.org/W2904455790","https://openalex.org/W2949963774","https://openalex.org/W2964015378","https://openalex.org/W2971598376","https://openalex.org/W2995937146","https://openalex.org/W2996786181","https://openalex.org/W2998367975","https://openalex.org/W3012934742","https://openalex.org/W3014503118","https://openalex.org/W3021603984","https://openalex.org/W3032554070","https://openalex.org/W3034971464","https://openalex.org/W3035569762","https://openalex.org/W3046288222","https://openalex.org/W3093143205","https://openalex.org/W3132337045","https://openalex.org/W3170717711","https://openalex.org/W3192797213","https://openalex.org/W3199614200","https://openalex.org/W4226323298","https://openalex.org/W4287755265","https://openalex.org/W4288594419","https://openalex.org/W4294558607","https://openalex.org/W4295598622","https://openalex.org/W4297733535","https://openalex.org/W4299802797","https://openalex.org/W6601057158","https://openalex.org/W6677939520","https://openalex.org/W6679938814","https://openalex.org/W6680600882","https://openalex.org/W6680628479","https://openalex.org/W6726873649","https://openalex.org/W6738796088","https://openalex.org/W6738964360","https://openalex.org/W6743410771","https://openalex.org/W6745537798","https://openalex.org/W6749304979","https://openalex.org/W6752110883","https://openalex.org/W6752380930","https://openalex.org/W6758846586","https://openalex.org/W6762491519","https://openalex.org/W6768539364","https://openalex.org/W6770566355","https://openalex.org/W6771904302","https://openalex.org/W6775529125","https://openalex.org/W6775715841","https://openalex.org/W6776835688","https://openalex.org/W6779109570","https://openalex.org/W6781750019","https://openalex.org/W6784152626","https://openalex.org/W6784745743","https://openalex.org/W6792529980","https://openalex.org/W6810655720"],"related_works":["https://openalex.org/W2468279273","https://openalex.org/W2354198838","https://openalex.org/W1989130879","https://openalex.org/W2103419012","https://openalex.org/W2378211422","https://openalex.org/W2988126442","https://openalex.org/W4321353415","https://openalex.org/W2745001401","https://openalex.org/W1974414866","https://openalex.org/W2130974462"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"reinforcement":[3],"learning":[4],"has":[5],"faced":[6],"several":[7],"challenges":[8],"in":[9,101],"the":[10,15,29,34,71,115,152],"multi-agent":[11],"domain,":[12],"such":[13],"as":[14,23],"credit":[16,30],"assignment":[17,31],"issue.":[18],"Value":[19],"function":[20,45],"factorization":[21,46],"emerges":[22],"a":[24,89,109,138],"promising":[25],"way":[26],"to":[27,56,78,113,131],"handle":[28],"issue":[32],"under":[33],"centralized":[35],"training":[36],"with":[37,50,137],"decentralized":[38],"execution":[39],"(CTDE)":[40],"paradigm.":[41],"However,":[42],"existing":[43],"value":[44],"methods":[47,66,150],"cannot":[48,76],"deal":[49],"ad-hoc":[51,102,157],"cooperation,":[52],"that":[53,128,145],"is,":[54],"adapting":[55],"new":[57],"configurations":[58],"of":[59,81,108,135,141],"teammates":[60,136],"at":[61],"test":[62],"time.":[63],"Specifically,":[64],"these":[65,85],"do":[67],"not":[68],"explicitly":[69],"utilize":[70],"relationship":[72],"between":[73,118],"agents":[74],"and":[75,156],"adapt":[77],"different":[79],"sizes":[80],"inputs.":[82],"To":[83],"address":[84],"limitations,":[86],"we":[87],"propose":[88],"novel":[90],"method,":[91],"called":[92],"Relation-Aware":[93],"Credit":[94],"Assignment":[95],"(RACA),":[96],"which":[97],"achieves":[98],"zero-shot":[99],"generalization":[100],"cooperation":[103,158],"scenarios.":[104,159],"RACA":[105,121],"takes":[106],"advantage":[107],"graph-based":[110],"relation":[111],"encoder":[112],"encode":[114],"topological":[116],"structure":[117],"agents.":[119],"Furthermore,":[120],"utilizes":[122],"an":[123,132],"attention-based":[124],"observation":[125],"abstraction":[126],"mechanism":[127],"can":[129],"generalize":[130],"arbitrary":[133],"number":[134,140],"fixed":[139],"parameters.":[142],"Experiments":[143],"demonstrate":[144],"our":[146],"method":[147],"outperforms":[148],"baseline":[149],"on":[151],"StarCraftII":[153],"micromanagement":[154],"benchmark":[155]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
