{"id":"https://openalex.org/W4396877652","doi":"https://doi.org/10.1109/tpami.2024.3399936","title":"Interaction Pattern Disentangling for Multi-Agent Reinforcement Learning","display_name":"Interaction Pattern Disentangling for Multi-Agent Reinforcement Learning","publication_year":2024,"publication_date":"2024-05-13","ids":{"openalex":"https://openalex.org/W4396877652","doi":"https://doi.org/10.1109/tpami.2024.3399936","pmid":"https://pubmed.ncbi.nlm.nih.gov/38739512"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2024.3399936","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2024.3399936","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090854835","display_name":"Shunyu Liu","orcid":"https://orcid.org/0000-0003-0584-9129"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shunyu Liu","raw_affiliation_strings":["State Key Laboratory of Blockchain and Security, Zhejiang University, Hangzhou, China","Hangzhou, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-0584-9129","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Blockchain and Security, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]},{"raw_affiliation_string":"Hangzhou, Hangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047371218","display_name":"Jie Song","orcid":"https://orcid.org/0000-0003-3671-6521"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Song","raw_affiliation_strings":["School of Software Technology, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-3671-6521","affiliations":[{"raw_affiliation_string":"School of Software Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048314356","display_name":"Yihe Zhou","orcid":"https://orcid.org/0009-0004-2595-6743"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yihe Zhou","raw_affiliation_strings":["State Key Laboratory of Blockchain and Security, Zhejiang University, Hangzhou, China","Hangzhou, Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0004-2595-6743","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Blockchain and Security, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]},{"raw_affiliation_string":"Hangzhou, Hangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101968615","display_name":"Na Yu","orcid":"https://orcid.org/0009-0008-5499-5388"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Na Yu","raw_affiliation_strings":["State Key Laboratory of Blockchain and Security, Zhejiang University, Hangzhou, China","Hangzhou, Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0008-5499-5388","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Blockchain and Security, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]},{"raw_affiliation_string":"Hangzhou, Hangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100632847","display_name":"Kaixuan Chen","orcid":"https://orcid.org/0000-0002-2492-5230"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaixuan Chen","raw_affiliation_strings":["State Key Laboratory of Blockchain and Security, Zhejiang University, Hangzhou, China","Hangzhou, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-2492-5230","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Blockchain and Security, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]},{"raw_affiliation_string":"Hangzhou, Hangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043914348","display_name":"Zunlei Feng","orcid":"https://orcid.org/0000-0001-8640-8434"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zunlei Feng","raw_affiliation_strings":["School of Software Technology, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-8640-8434","affiliations":[{"raw_affiliation_string":"School of Software Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026532752","display_name":"Mingli Song","orcid":"https://orcid.org/0000-0003-2621-6048"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingli Song","raw_affiliation_strings":["State Key Laboratory of Blockchain and Security, Zhejiang University, Hangzhou, China","Hangzhou, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-2621-6048","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Blockchain and Security, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]},{"raw_affiliation_string":"Hangzhou, Hangzhou, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5090854835"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":3.7004,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.93504876,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"46","issue":"12","first_page":"8157","last_page":"8172"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.7143999934196472,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.7143999934196472,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6773917078971863},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6361586451530457},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6150919198989868},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.38223356008529663},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.33034294843673706}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6773917078971863},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6361586451530457},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6150919198989868},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38223356008529663},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33034294843673706}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2024.3399936","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2024.3399936","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:38739512","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38739512","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":73,"referenced_works":["https://openalex.org/W2145339207","https://openalex.org/W2617547828","https://openalex.org/W2747213132","https://openalex.org/W2810602713","https://openalex.org/W2915117209","https://openalex.org/W2964199361","https://openalex.org/W2970777192","https://openalex.org/W2982316857","https://openalex.org/W2997070234","https://openalex.org/W2997502221","https://openalex.org/W2997536466","https://openalex.org/W2997940961","https://openalex.org/W2998367975","https://openalex.org/W3005335721","https://openalex.org/W3030840723","https://openalex.org/W3033672499","https://openalex.org/W3040652553","https://openalex.org/W3174032342","https://openalex.org/W3176265013","https://openalex.org/W3192708540","https://openalex.org/W3192815666","https://openalex.org/W3193101426","https://openalex.org/W3203076355","https://openalex.org/W3208809545","https://openalex.org/W4214717370","https://openalex.org/W4226309189","https://openalex.org/W4290948528","https://openalex.org/W4382202546","https://openalex.org/W4385245566","https://openalex.org/W6691766336","https://openalex.org/W6738796088","https://openalex.org/W6749304979","https://openalex.org/W6751139674","https://openalex.org/W6752380930","https://openalex.org/W6755069753","https://openalex.org/W6758846586","https://openalex.org/W6762491519","https://openalex.org/W6766390276","https://openalex.org/W6767327128","https://openalex.org/W6768539364","https://openalex.org/W6769462197","https://openalex.org/W6771904302","https://openalex.org/W6773690109","https://openalex.org/W6775529125","https://openalex.org/W6778102432","https://openalex.org/W6781210820","https://openalex.org/W6781750019","https://openalex.org/W6783196708","https://openalex.org/W6783940979","https://openalex.org/W6784046417","https://openalex.org/W6784152626","https://openalex.org/W6784778700","https://openalex.org/W6787618087","https://openalex.org/W6788165329","https://openalex.org/W6795826604","https://openalex.org/W6795908048","https://openalex.org/W6795975040","https://openalex.org/W6796258226","https://openalex.org/W6796333922","https://openalex.org/W6796436736","https://openalex.org/W6796664490","https://openalex.org/W6797233888","https://openalex.org/W6797584944","https://openalex.org/W6800682094","https://openalex.org/W6802002411","https://openalex.org/W6803290710","https://openalex.org/W6803595505","https://openalex.org/W6810079014","https://openalex.org/W6810518622","https://openalex.org/W6810655720","https://openalex.org/W6839455583","https://openalex.org/W6840380725","https://openalex.org/W6922480057"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W3046775127","https://openalex.org/W3107602296","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W2033914206"],"abstract_inverted_index":{"Deep":[0],"cooperative":[1],"multi-agent":[2,22],"reinforcement":[3],"learning":[4,23],"has":[5],"demonstrated":[6],"its":[7],"remarkable":[8],"success":[9],"over":[10],"a":[11,50,74,100,121],"wide":[12],"spectrum":[13],"of":[14,66,76,156],"complex":[15],"control":[16],"tasks.":[17],"However,":[18],"recent":[19],"advances":[20],"in":[21],"mainly":[24],"focus":[25],"on":[26,40,160],"value":[27],"decomposition":[28],"while":[29],"leaving":[30],"entity":[31,60],"interactions":[32,42,61,84],"still":[33],"intertwined,":[34],"which":[35,67],"easily":[36],"leads":[37],"to":[38,57,104,143,174],"over-fitting":[39],"noisy":[41,83],"between":[43,85,148],"entities.":[44,78],"In":[45],"this":[46],"work,":[47],"we":[48,141],"introduce":[49],"novel":[51],"interactiOn":[52],"Pattern":[53],"disenTangling":[54],"(OPT)":[55],"method,":[56],"disentangle":[58],"the":[59,77,82,114,133,145,149,153,168,175],"into":[62,120],"interaction":[63,71,111,123],"prototypes,":[64],"each":[65,157],"represents":[68],"an":[69,126],"underlying":[70],"pattern":[72,124],"within":[73],"subgroup":[75],"OPT":[79,98],"facilitates":[80],"filtering":[81],"irrelevant":[86],"entities":[87],"and":[88,107,152,163],"thus":[89],"significantly":[90],"improves":[91],"generalizability":[92],"as":[93,95],"well":[94],"interpretability.":[96],"Specifically,":[97],"introduces":[99],"sparse":[101],"disagreement":[102],"mechanism":[103],"encourage":[105],"sparsity":[106],"diversity":[108],"among":[109],"discovered":[110],"prototypes.":[112],"Then":[113],"model":[115],"selectively":[116],"restructures":[117],"these":[118],"prototypes":[119],"compact":[122],"by":[125,138],"aggregator":[127],"with":[128],"learnable":[129],"weights.":[130],"To":[131],"alleviate":[132],"training":[134],"instability":[135],"issue":[136],"caused":[137],"partial":[139],"observability,":[140],"propose":[142],"maximize":[144],"mutual":[146],"information":[147],"aggregation":[150],"weights":[151],"history":[154],"behaviors":[155],"agent.":[158],"Experiments":[159],"single-task,":[161],"multi-task":[162],"zero-shot":[164],"benchmarks":[165],"demonstrate":[166],"that":[167],"proposed":[169],"method":[170],"yields":[171],"results":[172],"superior":[173],"state-of-the-art":[176],"counterparts.":[177]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
