{"id":"https://openalex.org/W7134917643","doi":"https://doi.org/10.48550/arxiv.2603.09909","title":"MedMASLab: A Unified Orchestration Framework for Benchmarking Multimodal Medical Multi-Agent Systems","display_name":"MedMASLab: A Unified Orchestration Framework for Benchmarking Multimodal Medical Multi-Agent Systems","publication_year":2026,"publication_date":"2026-03-10","ids":{"openalex":"https://openalex.org/W7134917643","doi":"https://doi.org/10.48550/arxiv.2603.09909"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.09909","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09909","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.09909","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110444350","display_name":"Yazhuo Qian","orcid":"https://orcid.org/0009-0007-8544-6114"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Qian, Yunhang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128788069","display_name":"Xiaobin Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Xiaobin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128721363","display_name":"Jiaquan Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Jiaquan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128770280","display_name":"Siyang Xin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xin, Siyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126098387","display_name":"Xiaokun Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Xiaokun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128770343","display_name":"Jiangning Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jiangning","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062345781","display_name":"Peng-Tao Jiang","orcid":"https://orcid.org/0000-0002-1786-4943"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Peng-Tao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128731491","display_name":"Jiawei Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Jiawei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128800254","display_name":"Hongwei Bran Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Hongwei Bran","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5110444350"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.2110999971628189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.2110999971628189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.12060000002384186,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.10769999772310257,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7612000107765198},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.42820000648498535},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.412200003862381},{"id":"https://openalex.org/keywords/protocol","display_name":"Protocol (science)","score":0.3822000026702881},{"id":"https://openalex.org/keywords/orchestration","display_name":"Orchestration","score":0.3555999994277954},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.29679998755455017}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7612000107765198},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7304999828338623},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.5105000138282776},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.42820000648498535},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.412200003862381},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4034000039100647},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.3822000026702881},{"id":"https://openalex.org/C199168358","wikidata":"https://www.wikidata.org/wiki/Q3367000","display_name":"Orchestration","level":3,"score":0.3555999994277954},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.31130000948905945},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.29679998755455017},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.28360000252723694},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2822999954223633},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.26930001378059387},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2689000070095062},{"id":"https://openalex.org/C12269588","wikidata":"https://www.wikidata.org/wiki/Q132364","display_name":"Communications protocol","level":2,"score":0.2517000138759613}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.09909","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09909","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.09909","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09909","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.42462947964668274,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"While":[0],"Multi-Agent":[1],"Systems":[2],"(MAS)":[3],"show":[4],"potential":[5],"for":[6,57,175],"complex":[7],"clinical":[8,87,132,178],"decision":[9],"support,":[10],"the":[11,19,97],"field":[12],"remains":[13],"hindered":[14],"by":[15,102],"architectural":[16],"fragmentation":[17],"and":[18,38,54,111,125,167,183],"lack":[20,40],"of":[21,41,75,99,164],"standardized":[22,66],"multimodal":[23,58,67],"integration.":[24],"Current":[25],"medical":[26,59,82,157],"MAS":[27,78,144],"research":[28],"suffers":[29],"from":[30,130],"non-uniform":[31],"data":[32,129,184],"ingestion":[33],"pipelines,":[34],"inconsistent":[35],"visual-reasoning":[36],"evaluation,":[37],"a":[39,51,90,138,161,171],"cross-specialty":[42],"benchmarking.":[43],"To":[44],"address":[45],"these":[46],"challenges,":[47],"we":[48],"present":[49],"MedMASLab,":[50],"unified":[52],"framework":[53],"benchmarking":[55],"platform":[56],"multi-agent":[60],"systems.":[61,179],"MedMASLab":[62],"introduces:":[63],"(1)":[64],"A":[65],"agent":[68],"communication":[69],"protocol":[70],"that":[71,95],"enables":[72],"seamless":[73],"integration":[74],"11":[76,122,131],"heterogeneous":[77],"architectures":[79,149],"across":[80],"24":[81],"modalities.":[83],"(2)":[84],"An":[85],"automated":[86],"reasoning":[88,146],"evaluator,":[89],"zero-shot":[91],"semantic":[92],"evaluation":[93,136],"paradigm":[94],"overcomes":[96],"limitations":[98],"lexical":[100],"string-matching":[101],"leveraging":[103],"large":[104],"vision-language":[105],"models":[106],"to":[107,119],"verify":[108],"diagnostic":[109],"logic":[110],"visual":[112],"grounding.":[113],"(3)":[114],"The":[115,180],"most":[116],"extensive":[117],"benchmark":[118],"date,":[120],"spanning":[121],"organ":[123],"systems":[124],"473":[126],"diseases,":[127],"standardizing":[128],"benchmarks.":[133],"Our":[134],"systematic":[135],"reveals":[137],"critical":[139],"domain-specific":[140],"performance":[141],"gap:":[142],"while":[143],"improves":[145],"depth,":[147],"current":[148],"exhibit":[150],"significant":[151],"fragility":[152],"when":[153],"transitioning":[154],"between":[155],"specialized":[156],"sub-domains.":[158],"We":[159],"provide":[160],"rigorous":[162],"ablation":[163],"interaction":[165],"mechanisms":[166],"cost-performance":[168],"trade-offs,":[169],"establishing":[170],"new":[172],"technical":[173],"baseline":[174],"future":[176],"autonomous":[177],"source":[181],"code":[182],"is":[185],"publicly":[186],"available":[187],"at:":[188],"https://github.com/NUS-Project/MedMASLab/":[189]},"counts_by_year":[],"updated_date":"2026-03-12T06:18:43.230356","created_date":"2026-03-12T00:00:00"}
