{"id":"https://openalex.org/W4407123512","doi":"https://doi.org/10.48550/arxiv.2502.00345","title":"The Composite Task Challenge for Cooperative Multi-Agent Reinforcement Learning","display_name":"The Composite Task Challenge for Cooperative Multi-Agent Reinforcement Learning","publication_year":2025,"publication_date":"2025-02-01","ids":{"openalex":"https://openalex.org/W4407123512","doi":"https://doi.org/10.48550/arxiv.2502.00345"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2502.00345","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.00345","pdf_url":"https://arxiv.org/pdf/2502.00345","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2502.00345","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102756396","display_name":"Yurui Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Yurui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100342243","display_name":"Yuxuan Chen","orcid":"https://orcid.org/0000-0002-3044-4169"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yuxuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100418968","display_name":"Zhang Li","orcid":"https://orcid.org/0000-0003-1659-0466"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103196339","display_name":"Shijian Li","orcid":"https://orcid.org/0000-0001-5846-3065"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Shijian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101975457","display_name":"Gang Pan","orcid":"https://orcid.org/0000-0003-2155-4689"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Gang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5102756396"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.7325000166893005,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.7325000166893005,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7651951909065247},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6272174119949341},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.6040248870849609},{"id":"https://openalex.org/keywords/composite-number","display_name":"Composite number","score":0.5186611413955688},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.42320847511291504},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.308168888092041},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.2053355574607849},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.14292126893997192},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.0958254337310791},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.058317720890045166}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7651951909065247},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6272174119949341},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.6040248870849609},{"id":"https://openalex.org/C104779481","wikidata":"https://www.wikidata.org/wiki/Q50707","display_name":"Composite number","level":2,"score":0.5186611413955688},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.42320847511291504},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.308168888092041},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2053355574607849},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14292126893997192},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0958254337310791},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.058317720890045166},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2502.00345","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.00345","pdf_url":"https://arxiv.org/pdf/2502.00345","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2502.00345","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2502.00345","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2502.00345","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.00345","pdf_url":"https://arxiv.org/pdf/2502.00345","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4407123512.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W2086122291","https://openalex.org/W1987513656"],"abstract_inverted_index":{"The":[0],"significant":[1],"role":[2],"of":[3,5,27,59,71,79,104,140,171,179,195,198],"division":[4],"labor":[6],"(DOL)":[7],"in":[8,14,37,62,82],"promoting":[9],"cooperation":[10,31,125],"is":[11,46,86,204],"widely":[12],"recognized":[13],"real-world":[15,83,113],"applications.Many":[16],"cooperative":[17,150],"multi-agent":[18,94],"reinforcement":[19],"learning":[20],"(MARL)":[21],"methods":[22,64,81,152],"have":[23],"incorporated":[24],"the":[25,34,56,69,75,116,138,154,169,196,199],"concept":[26,61],"DOL":[28,45,60,95,123],"to":[29,42,68,89,107,136,143,188],"improve":[30],"among":[32],"agents.However,":[33],"tasks":[35,43,91,105,131,142],"used":[36],"existing":[38],"testbeds":[39],"typically":[40],"correspond":[41],"where":[44],"often":[47],"not":[48],"a":[49,87,102],"necessary":[50,88,127],"feature":[51],"for":[52,118,129],"achieving":[53],"optimal":[54],"policies.Additionally,":[55],"full":[57],"utilize":[58],"MARL":[63,80,151],"remains":[65],"unrealized":[66],"due":[67],"absence":[70],"appropriate":[72],"tasks.To":[73,166],"enhance":[74],"generality":[76],"and":[77,96,124,132],"applicability":[78],"scenarios,":[84],"there":[85],"develop":[90],"that":[92,122,159,184],"demand":[93],"cooperation.In":[97],"this":[98],"paper,":[99],"we":[100,174],"propose":[101,176],"series":[103],"designed":[106],"meet":[108],"these":[109,165,172,190],"requirements,":[110],"drawing":[111],"on":[112,153,164],"rules":[114],"as":[115],"guidance":[117],"their":[119],"design.We":[120],"guarantee":[121],"are":[126,186],"condition":[128],"completing":[130],"introduce":[133],"three":[134],"factors":[135],"expand":[137],"diversity":[139],"proposed":[141,155,180,200],"cover":[144],"more":[145],"realistic":[146],"situations.We":[147],"evaluate":[148],"10":[149],"tasks.The":[156,201],"results":[157,182],"indicate":[158],"all":[160],"baselines":[161,185],"perform":[162],"poorly":[163],"further":[167],"validate":[168],"solvability":[170,197],"tasks,":[173],"also":[175],"simplified":[177,191],"variants":[178],"tasks.Experimental":[181],"show":[183],"able":[187],"handle":[189],"variants,":[192],"providing":[193],"evidence":[194],"source":[202],"files":[203],"available":[205],"at":[206],"https://github.com/Yurui-Li/CTC.":[207]},"counts_by_year":[],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
