{"id":"https://openalex.org/W6966785682","doi":"https://doi.org/10.48550/arxiv.2507.05520","title":"Architecting Clinical Collaboration: Multi-Agent Reasoning Systems for Multimodal Medical VQA","display_name":"Architecting Clinical Collaboration: Multi-Agent Reasoning Systems for Multimodal Medical VQA","publication_year":2025,"publication_date":"2025-07-07","ids":{"openalex":"https://openalex.org/W6966785682","doi":"https://doi.org/10.48550/arxiv.2507.05520"},"language":"en","primary_location":{"id":"doi:10.48550/arxiv.2507.05520","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.05520","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2507.05520","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Thakrar, Karishma","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Thakrar, Karishma","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Basavatia, Shreyas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Basavatia, Shreyas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Daftardar, Akshay","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Daftardar, Akshay","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8288000226020813,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8288000226020813,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.02199999988079071,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.02160000056028366,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/medical-diagnosis","display_name":"Medical diagnosis","score":0.7160000205039978},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5863999724388123},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.48539999127388},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.46389999985694885},{"id":"https://openalex.org/keywords/expert-system","display_name":"Expert system","score":0.41819998621940613},{"id":"https://openalex.org/keywords/telemedicine","display_name":"Telemedicine","score":0.382999986410141},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.3677999973297119},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.35839998722076416}],"concepts":[{"id":"https://openalex.org/C534262118","wikidata":"https://www.wikidata.org/wiki/Q177719","display_name":"Medical diagnosis","level":2,"score":0.7160000205039978},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5863999724388123},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5723000168800354},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.48539999127388},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47530001401901245},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.46389999985694885},{"id":"https://openalex.org/C58328972","wikidata":"https://www.wikidata.org/wiki/Q184609","display_name":"Expert system","level":2,"score":0.41819998621940613},{"id":"https://openalex.org/C2779891985","wikidata":"https://www.wikidata.org/wiki/Q46994","display_name":"Telemedicine","level":3,"score":0.382999986410141},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.3677999973297119},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.35839998722076416},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.3416000008583069},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.33329999446868896},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3151000142097473},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.30820000171661377},{"id":"https://openalex.org/C535046627","wikidata":"https://www.wikidata.org/wiki/Q30612","display_name":"Clinical trial","level":2,"score":0.2944999933242798},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2939999997615814},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.28060001134872437},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.2784999907016754},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.27230000495910645},{"id":"https://openalex.org/C107327155","wikidata":"https://www.wikidata.org/wiki/Q330268","display_name":"Decision support system","level":2,"score":0.26570001244544983},{"id":"https://openalex.org/C3018838755","wikidata":"https://www.wikidata.org/wiki/Q31207","display_name":"Medical care","level":2,"score":0.259799987077713},{"id":"https://openalex.org/C2779473830","wikidata":"https://www.wikidata.org/wiki/Q1540899","display_name":"MEDLINE","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C63527458","wikidata":"https://www.wikidata.org/wiki/Q5133829","display_name":"Clinical decision support system","level":3,"score":0.2587999999523163},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.25540000200271606},{"id":"https://openalex.org/C20162079","wikidata":"https://www.wikidata.org/wiki/Q1151406","display_name":"Case-based reasoning","level":2,"score":0.2531000077724457}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2507.05520","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.05520","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2507.05520","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.05520","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Dermatological":[0],"care":[1],"via":[2],"telemedicine":[3],"often":[4],"lacks":[5],"the":[6,26,165],"rich":[7],"context":[8],"of":[9,20,28,120],"in-person":[10],"visits.":[11],"Clinicians":[12],"must":[13],"make":[14],"diagnoses":[15],"based":[16],"on":[17,70,131,144],"a":[18,59,109],"handful":[19],"images":[21],"and":[22,82,167],"brief":[23],"descriptions,":[24],"without":[25],"benefit":[27],"physical":[29],"exams,":[30],"second":[31],"opinions,":[32],"or":[33,98],"reference":[34],"materials.":[35],"While":[36,114],"many":[37],"medical":[38,71,103,160],"AI":[39,161],"systems":[40],"attempt":[41],"to":[42,95,112,139,171],"bridge":[43],"these":[44],"gaps":[45],"with":[46,85,123],"domain-specific":[47],"fine-tuning,":[48],"this":[49],"work":[50],"hypothesized":[51],"that":[52,89,101,159],"mimicking":[53],"clinical":[54,154,172],"reasoning":[55,87],"processes":[56],"could":[57],"offer":[58],"more":[60],"effective":[61],"path":[62],"forward.":[63],"This":[64],"study":[65],"tested":[66],"seven":[67,121],"vision-language":[68],"models":[69,122,129],"visual":[72],"question":[73],"answering":[74],"across":[75],"six":[76],"configurations:":[77],"baseline":[78,128],"models,":[79],"fine-tuned":[80],"variants,":[81],"both":[83],"augmented":[84],"either":[86],"layers":[88],"combine":[90],"multiple":[91],"model":[92],"perspectives,":[93],"analogous":[94],"peer":[96],"consultation,":[97],"retrieval-augmented":[99],"generation":[100],"incorporates":[102],"literature":[104],"at":[105],"inference":[106],"time,":[107],"serving":[108],"role":[110],"similar":[111],"reference-checking.":[113],"fine-tuning":[115],"degraded":[116],"performance":[117,143],"in":[118],"four":[119],"an":[124],"average":[125],"30%":[126],"decrease,":[127],"collapsed":[130],"test":[132],"data.":[133],"Clinical-inspired":[134],"architectures,":[135],"meanwhile,":[136],"achieved":[137],"up":[138],"70%":[140],"accuracy,":[141],"maintaining":[142],"unseen":[145],"data":[146],"while":[147],"generating":[148],"explainable,":[149],"literature-grounded":[150],"outputs":[151],"critical":[152],"for":[153],"adoption.":[155],"These":[156],"findings":[157],"demonstrate":[158],"succeeds":[162],"by":[163],"reconstructing":[164],"collaborative":[166],"evidence-based":[168],"practices":[169],"fundamental":[170],"diagnosis.":[173]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
