{"id":"https://openalex.org/W7127311890","doi":"https://doi.org/10.48550/arxiv.2602.01081","title":"MedAD-R1: Eliciting Consistent Reasoning in Interpretible Medical Anomaly Detection via Consistency-Reinforced Policy Optimization","display_name":"MedAD-R1: Eliciting Consistent Reasoning in Interpretible Medical Anomaly Detection via Consistency-Reinforced Policy Optimization","publication_year":2026,"publication_date":"2026-02-01","ids":{"openalex":"https://openalex.org/W7127311890","doi":"https://doi.org/10.48550/arxiv.2602.01081"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.01081","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124895187","display_name":"Haitao Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Haitao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124936672","display_name":"Yingying Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yingying","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124939113","display_name":"Jiaxiang Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Jiaxiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124935980","display_name":"Haote Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Haote","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124903296","display_name":"Hongyang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Hongyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124966852","display_name":"Yirong Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yirong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124912602","display_name":"Yue Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Yue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5110603747","display_name":"Xinghao Ding","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ding, Xinghao","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5124895187"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.4115999937057495,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.4115999937057495,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.3093999922275543,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.04410000145435333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.9226999878883362},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.7236999869346619},{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.6122999787330627},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6010000109672546},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.520799994468689},{"id":"https://openalex.org/keywords/trustworthiness","display_name":"Trustworthiness","score":0.41440001130104065}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.9226999878883362},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.7236999869346619},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6959999799728394},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6395000219345093},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.6122999787330627},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6092000007629395},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6010000109672546},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.520799994468689},{"id":"https://openalex.org/C153701036","wikidata":"https://www.wikidata.org/wiki/Q659974","display_name":"Trustworthiness","level":2,"score":0.41440001130104065},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.3788999915122986},{"id":"https://openalex.org/C12997251","wikidata":"https://www.wikidata.org/wiki/Q567560","display_name":"Anomaly (physics)","level":2,"score":0.3133000135421753},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.298799991607666},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.2711000144481659},{"id":"https://openalex.org/C2983241795","wikidata":"https://www.wikidata.org/wiki/Q6806500","display_name":"Medical decision making","level":2,"score":0.2678000032901764},{"id":"https://openalex.org/C20162079","wikidata":"https://www.wikidata.org/wiki/Q1151406","display_name":"Case-based reasoning","level":2,"score":0.26249998807907104}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.01081","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.01081","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.01081","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.01081","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.7656911015510559}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Medical":[0],"Anomaly":[1],"Detection":[2],"(MedAD)":[3],"presents":[4],"a":[5,83,104,137,191],"significant":[6],"opportunity":[7],"to":[8,17,94,141,182,194],"enhance":[9],"diagnostic":[10,68],"accuracy":[11],"using":[12],"Large":[13],"Multimodal":[14],"Models":[15],"(LMMs)":[16],"interpret":[18],"and":[19,35,48,62,99,149,185,198],"answer":[20],"questions":[21],"based":[22],"on":[23,29,33,164],"medical":[24,97],"images.":[25],"However,":[26],"the":[27,40,58,101,120,123,143,153,165,196],"reliance":[28],"Supervised":[30],"Fine-Tuning":[31],"(SFT)":[32],"simplistic":[34],"fragmented":[36],"datasets":[37],"has":[38],"hindered":[39],"development":[41],"of":[42,45,200],"models":[43],"capable":[44],"plausible":[46],"reasoning":[47,115,145,188],"robust":[49],"multimodal":[50],"generalization.":[51],"To":[52],"overcome":[53],"this,":[54],"we":[55,81],"introduce":[56],"MedAD-38K,":[57],"first":[59,88],"large-scale,":[60],"multi-modal,":[61],"multi-center":[63],"benchmark":[64],"for":[65,202],"MedAD":[66],"featuring":[67],"Chain-of-Thought":[69],"(CoT)":[70],"annotations":[71],"alongside":[72],"structured":[73,105],"Visual":[74],"Question-Answering":[75],"(VQA)":[76],"pairs.":[77],"On":[78],"this":[79],"foundation,":[80],"propose":[82],"two-stage":[84],"training":[85],"framework.":[86],"The":[87],"stage,":[89],"Cognitive":[90],"Injection,":[91],"uses":[92],"SFT":[93],"instill":[95],"foundational":[96],"knowledge":[98],"align":[100],"model":[102],"with":[103,152],"think-then-answer":[106],"paradigm.":[107],"Given":[108],"that":[109,116],"standard":[110],"policy":[111],"optimization":[112],"can":[113],"produce":[114],"is":[117,147],"disconnected":[118],"from":[119,179],"final":[121,154],"answer,":[122],"second":[124],"stage":[125],"incorporates":[126,136],"Consistency":[127],"Group":[128],"Relative":[129],"Policy":[130],"Optimization":[131],"(Con-GRPO).":[132],"This":[133,175],"novel":[134],"algorithm":[135],"crucial":[138],"consistency":[139],"reward":[140],"ensure":[142],"generated":[144],"process":[146],"relevant":[148],"logically":[150,186],"coherent":[151],"diagnosis.":[155],"Our":[156],"proposed":[157],"model,":[158],"MedAD-R1,":[159],"achieves":[160],"state-of-the-art":[161],"(SOTA)":[162],"performance":[163,177],"MedAD-38K":[166],"benchmark,":[167],"outperforming":[168],"strong":[169],"baselines":[170],"by":[171],"more":[172],"than":[173],"10\\%.":[174],"superior":[176],"stems":[178],"its":[180],"ability":[181],"generate":[183],"transparent":[184],"consistent":[187],"pathways,":[189],"offering":[190],"promising":[192],"approach":[193],"enhancing":[195],"trustworthiness":[197],"interpretability":[199],"AI":[201],"clinical":[203],"decision":[204],"support.":[205]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-04T00:00:00"}
