{"id":"https://openalex.org/W7161142988","doi":"https://doi.org/10.48550/arxiv.2605.12943","title":"Reinforced Collaboration in Multi-Agent Flow Networks","display_name":"Reinforced Collaboration in Multi-Agent Flow Networks","publication_year":2026,"publication_date":"2026-05-13","ids":{"openalex":"https://openalex.org/W7161142988","doi":"https://doi.org/10.48550/arxiv.2605.12943"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.12943","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.12943","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.12943","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136089935","display_name":"Zheng Wang","orcid":"https://orcid.org/0000-0001-8016-1098"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136119553","display_name":"Yuang Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yuang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136164016","display_name":"Yangkai Ding","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ding, Yangkai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.20160000026226044,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.20160000026226044,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1889999955892563,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.11749999970197678,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.8447999954223633},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6383000016212463},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.6291000247001648},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6118999719619751},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5633000135421753},{"id":"https://openalex.org/keywords/flow-network","display_name":"Flow network","score":0.38269999623298645},{"id":"https://openalex.org/keywords/flow","display_name":"Flow (mathematics)","score":0.37770000100135803}],"concepts":[{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.8447999954223633},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7784000039100647},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6383000016212463},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.6291000247001648},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6118999719619751},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5633000135421753},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4830000102519989},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3903999924659729},{"id":"https://openalex.org/C114809511","wikidata":"https://www.wikidata.org/wiki/Q1412924","display_name":"Flow network","level":2,"score":0.38269999623298645},{"id":"https://openalex.org/C38349280","wikidata":"https://www.wikidata.org/wiki/Q1434290","display_name":"Flow (mathematics)","level":2,"score":0.37770000100135803},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.3774999976158142},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.36160001158714294},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.32899999618530273},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.30820000171661377},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.29829999804496765},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2944999933242798},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2858999967575073},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27810001373291016},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2596000134944916},{"id":"https://openalex.org/C160191386","wikidata":"https://www.wikidata.org/wiki/Q868299","display_name":"Control flow","level":2,"score":0.25380000472068787}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.12943","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.12943","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.12943","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.12943","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.4252128601074219}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multi-agent":[0],"systems":[1],"provide":[2],"a":[3,14,65,75,99],"powerful":[4],"way":[5],"to":[6,90,105,121,135],"extend":[7],"large":[8],"language":[9],"models":[10],"(LLMs)":[11],"by":[12,21,30,130],"decomposing":[13],"complex":[15],"task":[16],"into":[17],"specialized":[18],"subtasks":[19],"handled":[20],"different":[22],"agents.":[23],"However,":[24],"their":[25],"performance":[26,123],"is":[27],"often":[28],"hindered":[29],"error":[31],"propagation,":[32],"arising":[33],"from":[34,79],"suboptimal":[35],"workflow":[36,93],"design":[37],"or":[38],"inaccurate":[39],"agent":[40,47,72,96],"outputs,":[41],"which":[42],"can":[43],"propagate":[44],"through":[45],"the":[46,56],"collaboration":[48,73],"process":[49],"and":[50,70,87,95,132,140],"degrade":[51],"final":[52],"results.":[53],"To":[54],"address":[55],"challenges,":[57],"we":[58],"present":[59],"MANGO":[60,83,118],"(Multi-Agent":[61],"Network":[62],"Gradient":[63],"Optimization),":[64],"data-driven":[66],"framework":[67],"that":[68,117],"organizes":[69],"refines":[71],"via":[74],"flow":[76],"network":[77],"constructed":[78],"past":[80],"successful":[81],"workflows.":[82],"integrates":[84],"reinforcement":[85],"learning":[86],"textual":[88],"gradients":[89],"jointly":[91],"optimize":[92],"paths":[94],"behaviors,":[97],"while":[98],"skipping":[100],"mechanism":[101],"prevents":[102],"redundant":[103],"updates":[104],"well-optimized":[106],"agents":[107],"for":[108],"improving":[109],"efficiency.":[110],"Extensive":[111],"experiments":[112],"on":[113],"seven":[114],"benchmarks":[115],"show":[116],"achieves":[119],"up":[120],"12.8%":[122],"improvement":[124],"over":[125],"state-of-the-art":[126],"baselines,":[127],"enhances":[128],"efficiency":[129],"47.4%,":[131],"generalizes":[133],"effectively":[134],"unseen":[136],"domains.":[137],"Our":[138],"code":[139],"datasets":[141],"are":[142],"publicly":[143],"available":[144],"at":[145],"https://github.com/openJiuwen-ai/agent-store/tree/main/community/mango.":[146]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-05-15T00:00:00"}
