{"id":"https://openalex.org/W4366238939","doi":"https://doi.org/10.1109/tnnls.2023.3262921","title":"Learning Multi-Agent Cooperation via Considering Actions of Teammates","display_name":"Learning Multi-Agent Cooperation via Considering Actions of Teammates","publication_year":2023,"publication_date":"2023-04-18","ids":{"openalex":"https://openalex.org/W4366238939","doi":"https://doi.org/10.1109/tnnls.2023.3262921","pmid":"https://pubmed.ncbi.nlm.nih.gov/37071511"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2023.3262921","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3262921","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031053184","display_name":"Shanqi Liu","orcid":"https://orcid.org/0000-0003-0583-2423"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Shanqi Liu","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, Zhejiang, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100359512","display_name":"Weiwei Liu","orcid":"https://orcid.org/0000-0002-2496-7748"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Weiwei Liu","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, Zhejiang, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004120702","display_name":"Wenzhou Chen","orcid":"https://orcid.org/0000-0002-1443-1077"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenzhou Chen","raw_affiliation_strings":["College of Computer Science, Hangzhou Dianzi University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science, Hangzhou Dianzi University, Hangzhou, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014432572","display_name":"Guanzhong Tian","orcid":"https://orcid.org/0000-0002-7292-4056"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guanzhong Tian","raw_affiliation_strings":["Ningbo Innovation Center, Zhejiang University, Hangzhou, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"Ningbo Innovation Center, Zhejiang University, Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100730479","display_name":"Jun Chen","orcid":"https://orcid.org/0000-0001-6568-8801"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jun Chen","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, Zhejiang, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038569817","display_name":"Yao Tong","orcid":"https://orcid.org/0000-0002-7885-3922"},"institutions":[{"id":"https://openalex.org/I4210132539","display_name":"Northwest Institute of Mechanical and Electrical Engineering","ror":"https://ror.org/03pz37k82","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210132539"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yao Tong","raw_affiliation_strings":["Northwest Institute of Mechanical and Electrical Engineering and the Northwest Electromechanical Engineering Research Institute, Xianyang, China"],"affiliations":[{"raw_affiliation_string":"Northwest Institute of Mechanical and Electrical Engineering and the Northwest Electromechanical Engineering Research Institute, Xianyang, China","institution_ids":["https://openalex.org/I4210132539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056945088","display_name":"Junjie Cao","orcid":"https://orcid.org/0000-0003-0484-8167"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Junjie Cao","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, Zhejiang, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100724297","display_name":"Yong Liu","orcid":"https://orcid.org/0000-0003-4822-8939"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yong Liu","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, Zhejiang, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5031053184"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.3921,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.81665857,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"35","issue":"8","first_page":"11553","last_page":"11564"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6189772486686707},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.6151262521743774},{"id":"https://openalex.org/keywords/monotonic-function","display_name":"Monotonic function","score":0.5705381631851196},{"id":"https://openalex.org/keywords/soar","display_name":"Soar","score":0.5664253830909729},{"id":"https://openalex.org/keywords/notation","display_name":"Notation","score":0.5647938847541809},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.46206626296043396},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3642275035381317},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.23496779799461365}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6189772486686707},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.6151262521743774},{"id":"https://openalex.org/C72169020","wikidata":"https://www.wikidata.org/wiki/Q194404","display_name":"Monotonic function","level":2,"score":0.5705381631851196},{"id":"https://openalex.org/C17305859","wikidata":"https://www.wikidata.org/wiki/Q382944","display_name":"Soar","level":2,"score":0.5664253830909729},{"id":"https://openalex.org/C45357846","wikidata":"https://www.wikidata.org/wiki/Q2001982","display_name":"Notation","level":2,"score":0.5647938847541809},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.46206626296043396},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3642275035381317},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.23496779799461365},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2023.3262921","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3262921","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:37071511","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37071511","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Partnerships for the goals","score":0.41999998688697815,"id":"https://metadata.un.org/sdg/17"}],"awards":[{"id":"https://openalex.org/G2575069074","display_name":null,"funder_award_id":"62088101","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8649216278","display_name":null,"funder_award_id":"U21A20484","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W1606056663","https://openalex.org/W1641379095","https://openalex.org/W2012060729","https://openalex.org/W2012812921","https://openalex.org/W2018375997","https://openalex.org/W2159309155","https://openalex.org/W2292533394","https://openalex.org/W2588790649","https://openalex.org/W2594035753","https://openalex.org/W2617547828","https://openalex.org/W2626637010","https://openalex.org/W2810602713","https://openalex.org/W2918867912","https://openalex.org/W2963296584","https://openalex.org/W2963658727","https://openalex.org/W2963934958","https://openalex.org/W2995937146","https://openalex.org/W2996784529","https://openalex.org/W3036329728","https://openalex.org/W3046288222","https://openalex.org/W3089778445","https://openalex.org/W3093143205","https://openalex.org/W3099518626","https://openalex.org/W3175698408","https://openalex.org/W3196869853","https://openalex.org/W4200629404","https://openalex.org/W4212814156","https://openalex.org/W4288091739","https://openalex.org/W4288594419","https://openalex.org/W4299802797","https://openalex.org/W6679395995","https://openalex.org/W6680628479","https://openalex.org/W6738796088","https://openalex.org/W6739516088","https://openalex.org/W6748554570","https://openalex.org/W6749304979","https://openalex.org/W6755069753","https://openalex.org/W6758846586","https://openalex.org/W6762491519","https://openalex.org/W6767327128","https://openalex.org/W6768539364","https://openalex.org/W6775529125","https://openalex.org/W6781750019","https://openalex.org/W6783196708","https://openalex.org/W6784121806","https://openalex.org/W6784745743","https://openalex.org/W6797064975","https://openalex.org/W6805193650","https://openalex.org/W7025312208"],"related_works":["https://openalex.org/W1972687012","https://openalex.org/W2163445345","https://openalex.org/W4250121399","https://openalex.org/W2506478959","https://openalex.org/W2583284593","https://openalex.org/W39838470","https://openalex.org/W1578440997","https://openalex.org/W1540770276","https://openalex.org/W4242275050","https://openalex.org/W4246056463"],"abstract_inverted_index":{"Recently":[0],"value-based":[1],"centralized":[2],"training":[3],"with":[4,91],"decentralized":[5],"execution":[6],"(CTDE)":[7],"multi-agent":[8],"reinforcement":[9],"learning":[10],"(MARL)":[11],"methods":[12,48],"have":[13],"achieved":[14],"excellent":[15],"performance":[16,177],"in":[17,121,126,179],"cooperative":[18],"tasks.":[19],"However,":[20],"the":[21,32,80,97,102,127,189],"most":[22],"representative":[23],"method":[24,110,136,174],"among":[25],"these":[26],"methods,":[27],"Q-network":[28],"MIXing":[29],"(QMIX),":[30],"restricts":[31],"joint":[33],"action":[34,108],"Q":[35,74],"values":[36,75],"to":[37,51,95,139,152,164],"be":[38],"a":[39,72,106,157],"monotonic":[40,182],"mixing":[41],"of":[42,82,129],"each":[43],"agent's":[44],"utilities.":[45],"Furthermore,":[46,145],"current":[47],"cannot":[49],"generalize":[50],"unseen":[52],"environments":[53],"or":[54,124],"different":[55],"agent":[56,84],"configurations,":[57],"which":[58],"is":[59,116],"known":[60],"as":[61],"ad":[62,140,190],"hoc":[63,141,191],"team":[64,142,192],"play":[65,143,193],"situation.":[66,144],"In":[67,132],"this":[68,133],"work,":[69],"we":[70,104,146],"propose":[71,105],"novel":[73],"decomposition":[76],"that":[77,111,172],"considers":[78],"both":[79,180],"return":[81],"an":[83,148],"acting":[85],"on":[86,101],"its":[87],"own":[88],"and":[89,115,156,183,186],"cooperating":[90],"other":[92],"observable":[93,122],"agents":[94,123],"address":[96],"nonmonotonic":[98,184],"problem.":[99],"Based":[100],"decomposition,":[103],"greedy":[107],"searching":[109],"can":[112,137,187],"improve":[113],"exploration":[114],"not":[117],"affected":[118],"by":[119],"changes":[120,125],"order":[128],"agents'":[130],"actions.":[131],"way,":[134],"our":[135,173],"adapt":[138],"utilize":[147],"auxiliary":[149],"loss":[150],"related":[151],"environmental":[153],"cognition":[154],"consistency":[155],"modified":[158],"prioritized":[159],"experience":[160],"replay":[161],"(PER)":[162],"buffer":[163],"assist":[165],"training.":[166],"Our":[167],"extensive":[168],"experimental":[169],"results":[170],"show":[171],"achieves":[175],"significant":[176],"improvements":[178],"challenging":[181],"domains,":[185],"handle":[188],"situation":[194],"perfectly.":[195]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
