{"id":"https://openalex.org/W7131834671","doi":"https://doi.org/10.48550/arxiv.2602.22959","title":"Can Agents Distinguish Visually Hard-to-Separate Diseases in a Zero-Shot Setting? A Pilot Study","display_name":"Can Agents Distinguish Visually Hard-to-Separate Diseases in a Zero-Shot Setting? A Pilot Study","publication_year":2026,"publication_date":"2026-02-26","ids":{"openalex":"https://openalex.org/W7131834671","doi":"https://doi.org/10.48550/arxiv.2602.22959"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.22959","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5127179587","display_name":"Zihao Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhao, Zihao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084592753","display_name":"Frederik Hauke","orcid":"https://orcid.org/0000-0003-3434-5720"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hauke, Frederik","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127094696","display_name":"Juliana De Castilhos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"De Castilhos, Juliana","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5117184858","display_name":"Sven Nebelung","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nebelung, Sven","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5033991658","display_name":"H. Scharr","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Truhn, Daniel","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5127179587"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10392","display_name":"Cutaneous Melanoma Detection and Management","score":0.392300009727478,"subfield":{"id":"https://openalex.org/subfields/2730","display_name":"Oncology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10392","display_name":"Cutaneous Melanoma Detection and Management","score":0.392300009727478,"subfield":{"id":"https://openalex.org/subfields/2730","display_name":"Oncology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.18559999763965607,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.04529999941587448,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/medical-diagnosis","display_name":"Medical diagnosis","score":0.4674000144004822},{"id":"https://openalex.org/keywords/crowdsourcing","display_name":"Crowdsourcing","score":0.3700000047683716},{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.33219999074935913},{"id":"https://openalex.org/keywords/diagnostic-test","display_name":"Diagnostic test","score":0.30480000376701355},{"id":"https://openalex.org/keywords/limit","display_name":"Limit (mathematics)","score":0.2847000062465668},{"id":"https://openalex.org/keywords/diagnostic-accuracy","display_name":"Diagnostic accuracy","score":0.2667999863624573}],"concepts":[{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.5393000245094299},{"id":"https://openalex.org/C534262118","wikidata":"https://www.wikidata.org/wiki/Q177719","display_name":"Medical diagnosis","level":2,"score":0.4674000144004822},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42829999327659607},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.3700000047683716},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.36010000109672546},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.33219999074935913},{"id":"https://openalex.org/C82157600","wikidata":"https://www.wikidata.org/wiki/Q2671652","display_name":"Diagnostic test","level":2,"score":0.30480000376701355},{"id":"https://openalex.org/C151201525","wikidata":"https://www.wikidata.org/wiki/Q177239","display_name":"Limit (mathematics)","level":2,"score":0.2847000062465668},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2703000009059906},{"id":"https://openalex.org/C19527891","wikidata":"https://www.wikidata.org/wiki/Q1120908","display_name":"Medical physics","level":1,"score":0.2671999931335449},{"id":"https://openalex.org/C3020132585","wikidata":"https://www.wikidata.org/wiki/Q2671652","display_name":"Diagnostic accuracy","level":2,"score":0.2667999863624573},{"id":"https://openalex.org/C3018587665","wikidata":"https://www.wikidata.org/wiki/Q7268696","display_name":"Qualitative analysis","level":3,"score":0.26649999618530273},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25870001316070557},{"id":"https://openalex.org/C2983449737","wikidata":"https://www.wikidata.org/wiki/Q177719","display_name":"Clinical diagnosis","level":2,"score":0.25189998745918274}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.22959","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.22959","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.22959","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.22959","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"rapid":[1],"progress":[2],"of":[3,128],"multimodal":[4],"large":[5],"language":[6],"models":[7],"(MLLMs)":[8],"has":[9],"led":[10],"to":[11,136],"increasing":[12],"interest":[13],"in":[14,21,42,76,97,122,153],"agent-based":[15],"systems.":[16],"While":[17],"most":[18],"prior":[19],"work":[20],"medical":[22],"imaging":[23],"concentrates":[24],"on":[25,50,85,99,106],"automating":[26],"routine":[27],"clinical":[28,77,115,129],"workflows,":[29],"we":[30],"study":[31,145],"an":[32],"underexplored":[33],"yet":[34],"clinically":[35],"significant":[36],"setting:":[37],"distinguishing":[38],"visually":[39,154],"hard-to-separate":[40],"diseases":[41],"a":[43,81],"zero-shot":[44,150],"setting.":[45],"We":[46,79,117],"benchmark":[47],"representative":[48],"agents":[49],"two":[51],"imaging-only":[52],"proxy":[53],"diagnostic":[54,92],"tasks,":[55],"(1)":[56],"melanoma":[57],"vs.":[58,65],"atypical":[59],"nevus":[60],"and":[61,102,125],"(2)":[62],"pulmonary":[63],"edema":[64],"pneumonia,":[66],"where":[67],"visual":[68],"features":[69],"are":[70],"highly":[71],"confounded":[72,155],"despite":[73],"substantial":[74],"differences":[75],"management.":[78],"introduce":[80],"multi-agent":[82],"framework":[83],"based":[84],"contrastive":[86],"adjudication.":[87],"Experimental":[88],"results":[89],"show":[90],"improved":[91],"performance":[93,111,152],"(an":[94],"11-percentage-point":[95],"gain":[96],"accuracy":[98],"dermoscopy":[100],"data)":[101],"reduced":[103],"unsupported":[104],"claims":[105],"qualitative":[107],"samples,":[108],"although":[109],"overall":[110],"remains":[112],"insufficient":[113],"for":[114],"deployment.":[116],"acknowledge":[118],"the":[119,126,134],"inherent":[120],"uncertainty":[121],"human":[123],"annotations":[124],"absence":[127],"context,":[130],"which":[131],"further":[132],"limit":[133],"translation":[135],"real-world":[137],"settings.":[138],"Within":[139],"this":[140,143],"controlled":[141],"setting,":[142],"pilot":[144],"provides":[146],"preliminary":[147],"insights":[148],"into":[149],"agent":[151],"scenarios.":[156]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-28T00:00:00"}
