{"id":"https://openalex.org/W4399801175","doi":"https://doi.org/10.1109/tnnls.2024.3394513","title":"Multiagent Continual Coordination via Progressive Task Contextualization","display_name":"Multiagent Continual Coordination via Progressive Task Contextualization","publication_year":2024,"publication_date":"2024-06-19","ids":{"openalex":"https://openalex.org/W4399801175","doi":"https://doi.org/10.1109/tnnls.2024.3394513","pmid":"https://pubmed.ncbi.nlm.nih.gov/38896515"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2024.3394513","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2024.3394513","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041768936","display_name":"Lei Yuan","orcid":"https://orcid.org/0000-0002-7803-0766"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lei Yuan","raw_affiliation_strings":["National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-7803-0766","affiliations":[{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049063919","display_name":"Lihe Li","orcid":"https://orcid.org/0000-0002-7017-6488"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lihe Li","raw_affiliation_strings":["National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-7017-6488","affiliations":[{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005123740","display_name":"Ziqian Zhang","orcid":"https://orcid.org/0000-0002-0570-4969"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziqian Zhang","raw_affiliation_strings":["National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-0570-4969","affiliations":[{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101627473","display_name":"Fuxiang Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fuxiang Zhang","raw_affiliation_strings":["National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058506037","display_name":"Cong Guan","orcid":"https://orcid.org/0000-0002-5198-9141"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cong Guan","raw_affiliation_strings":["National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-5198-9141","affiliations":[{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101458462","display_name":"Yang Yu","orcid":"https://orcid.org/0000-0002-1052-5447"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Yu","raw_affiliation_strings":["National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-1052-5447","affiliations":[{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5041768936"],"corresponding_institution_ids":["https://openalex.org/I881766915"],"apc_list":null,"apc_paid":null,"fwci":0.9934,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.79255905,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":"36","issue":"4","first_page":"6326","last_page":"6340"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9812999963760376,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9277999997138977,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7618499398231506},{"id":"https://openalex.org/keywords/contextualization","display_name":"Contextualization","score":0.7130424976348877},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6272736191749573},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6223205924034119},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5394260883331299},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.45309239625930786},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4145236015319824},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3888489603996277},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3290560245513916},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09087160229682922},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.08616247773170471}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7618499398231506},{"id":"https://openalex.org/C2780712339","wikidata":"https://www.wikidata.org/wiki/Q5165204","display_name":"Contextualization","level":3,"score":0.7130424976348877},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6272736191749573},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6223205924034119},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5394260883331299},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.45309239625930786},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4145236015319824},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3888489603996277},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3290560245513916},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09087160229682922},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.08616247773170471},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2024.3394513","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2024.3394513","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:38896515","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38896515","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4366907579","display_name":null,"funder_award_id":"2020AAA0107200","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G528746023","display_name":null,"funder_award_id":"61921006","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5635164781","display_name":null,"funder_award_id":"62022039","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":68,"referenced_works":["https://openalex.org/W2089468765","https://openalex.org/W2099618002","https://openalex.org/W2116064496","https://openalex.org/W2157364932","https://openalex.org/W2560647685","https://openalex.org/W2747213132","https://openalex.org/W2788388592","https://openalex.org/W2892258706","https://openalex.org/W2950635152","https://openalex.org/W2968526727","https://openalex.org/W2991046523","https://openalex.org/W3046093665","https://openalex.org/W3117215073","https://openalex.org/W3153573172","https://openalex.org/W3165631200","https://openalex.org/W3170823761","https://openalex.org/W3173211893","https://openalex.org/W3174406242","https://openalex.org/W3175458185","https://openalex.org/W3196869853","https://openalex.org/W3205279237","https://openalex.org/W3210169707","https://openalex.org/W4213246061","https://openalex.org/W4220822815","https://openalex.org/W4220918847","https://openalex.org/W4224317003","https://openalex.org/W4224874620","https://openalex.org/W4282944715","https://openalex.org/W4308365139","https://openalex.org/W4313131480","https://openalex.org/W4365459358","https://openalex.org/W4385245566","https://openalex.org/W4388317804","https://openalex.org/W4390638728","https://openalex.org/W4390951782","https://openalex.org/W4391259941","https://openalex.org/W4400994346","https://openalex.org/W4402618490","https://openalex.org/W6738796088","https://openalex.org/W6741087337","https://openalex.org/W6749304979","https://openalex.org/W6752380930","https://openalex.org/W6756754374","https://openalex.org/W6758846586","https://openalex.org/W6760539816","https://openalex.org/W6762491519","https://openalex.org/W6763462227","https://openalex.org/W6763484891","https://openalex.org/W6771640813","https://openalex.org/W6774673717","https://openalex.org/W6779043139","https://openalex.org/W6781750019","https://openalex.org/W6791040878","https://openalex.org/W6791079441","https://openalex.org/W6791129655","https://openalex.org/W6796436736","https://openalex.org/W6802325372","https://openalex.org/W6803204313","https://openalex.org/W6803595505","https://openalex.org/W6810079014","https://openalex.org/W6838682728","https://openalex.org/W6840380725","https://openalex.org/W6842091875","https://openalex.org/W6842690010","https://openalex.org/W6843745752","https://openalex.org/W6846406187","https://openalex.org/W6846528917","https://openalex.org/W6846722307"],"related_works":["https://openalex.org/W1687432146","https://openalex.org/W1591874556","https://openalex.org/W2185608106","https://openalex.org/W3046258185","https://openalex.org/W1548083239","https://openalex.org/W3216994056","https://openalex.org/W2268232908","https://openalex.org/W2146570735","https://openalex.org/W205610463","https://openalex.org/W4296050054"],"abstract_inverted_index":{"Cooperative":[0],"multiagent":[1,77,164],"reinforcement":[2],"learning":[3,169],"(MARL)":[4],"has":[5,10],"attracted":[6],"significant":[7],"attention":[8],"and":[9,31,145],"the":[11,23,40,53,69,121,129,147,184],"potential":[12],"for":[13],"many":[14],"real-world":[15],"applications.":[16],"Previous":[17],"arts":[18],"mainly":[19],"focus":[20],"on":[21,120,153],"facilitating":[22],"coordination":[24,55,79],"ability":[25],"from":[26,188],"different":[27],"aspects":[28],"(e.g.,":[29],"nonstationarity":[30],"credit":[32],"assignment)":[33],"in":[34,46,60,89,106,138,156,162],"single-task":[35],"or":[36],"multitask":[37],"scenarios,":[38],"ignoring":[39],"stream":[41],"of":[42,110,186],"tasks":[43],"that":[44,166],"appear":[45],"a":[47,91,107,157],"continual":[48,54,78,168],"manner.":[49,159],"This":[50],"ignorance":[51],"makes":[52],"an":[56,75],"unexplored":[57],"territory,":[58],"neither":[59],"problem":[61],"formulation":[62],"nor":[63],"efficient":[64],"algorithms":[65],"designed.":[66],"Toward":[67],"tackling":[68],"mentioned":[70],"issue,":[71],"this":[72],"article":[73],"proposes":[74],"approach,":[76],"via":[80],"progressive":[81],"task":[82,102,113,123],"contextualization":[83],"(MACPro).":[84],"The":[85,112],"key":[86],"point":[87],"lies":[88],"obtaining":[90],"factorized":[92],"policy,":[93],"using":[94],"shared":[95],"feature":[96],"extraction":[97],"layers":[98],"but":[99],"separated":[100],"independent":[101],"heads,":[103],"each":[104,140],"specializing":[105],"specific":[108],"class":[109],"tasks.":[111],"heads":[114],"can":[115],"be":[116],"progressively":[117],"expanded":[118],"based":[119,152],"learned":[122],"contextualization.":[124],"Moreover,":[125],"to":[126,128,143,176],"cater":[127],"popular":[130],"centralized":[131],"training":[132],"with":[133],"decentralized":[134,158],"execution":[135],"(CTDE)":[136],"paradigm":[137],"MARL,":[139],"agent":[141],"learns":[142],"predict":[144],"adopt":[146],"most":[148],"relevant":[149],"policy":[150],"head":[151],"local":[154],"information":[155],"We":[160],"show":[161],"multiple":[163,189],"benchmarks":[165],"existing":[167],"methods":[170],"fail,":[171],"while":[172],"MACPro":[173,187],"is":[174],"able":[175],"achieve":[177],"close-to-optimal":[178],"performance.":[179],"More":[180],"results":[181],"also":[182],"disclose":[183],"effectiveness":[185],"aspects,":[190],"such":[191],"as":[192],"high":[193],"generalization":[194],"ability.":[195]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
