{"id":"https://openalex.org/W7154099677","doi":"https://doi.org/10.48550/arxiv.2604.09537","title":"Case-Grounded Evidence Verification: A Framework for Constructing Evidence-Sensitive Supervision","display_name":"Case-Grounded Evidence Verification: A Framework for Constructing Evidence-Sensitive Supervision","publication_year":2026,"publication_date":"2026-04-10","ids":{"openalex":"https://openalex.org/W7154099677","doi":"https://doi.org/10.48550/arxiv.2604.09537"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.09537","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.09537","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.09537","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076251937","display_name":"Soroosh Tayebi Arasteh","orcid":"https://orcid.org/0000-0003-1015-7733"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Arasteh, Soroosh Tayebi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034113400","display_name":"Mehdi Joodaki","orcid":"https://orcid.org/0000-0002-2184-7118"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Joodaki, Mehdi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040088150","display_name":"Mahshad Lotfinia","orcid":"https://orcid.org/0000-0001-7605-7992"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lotfinia, Mahshad","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091689170","display_name":"Sven Nebelung","orcid":"https://orcid.org/0000-0002-5267-9962"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nebelung, Sven","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5016512818","display_name":"Daniel Truhn","orcid":"https://orcid.org/0000-0002-9605-0728"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Truhn, Daniel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5076251937"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.550599992275238,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.550599992275238,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.09679999947547913,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12574","display_name":"Clinical Reasoning and Diagnostic Skills","score":0.04729999974370003,"subfield":{"id":"https://openalex.org/subfields/2714","display_name":"Family Practice"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/counterfactual-thinking","display_name":"Counterfactual thinking","score":0.7785000205039978},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6425999999046326},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5956000089645386},{"id":"https://openalex.org/keywords/empirical-evidence","display_name":"Empirical evidence","score":0.46219998598098755},{"id":"https://openalex.org/keywords/blame","display_name":"Blame","score":0.4345000088214874},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.41600000858306885},{"id":"https://openalex.org/keywords/parallels","display_name":"Parallels","score":0.3817000091075897},{"id":"https://openalex.org/keywords/argument","display_name":"Argument (complex analysis)","score":0.3725999891757965}],"concepts":[{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.7785000205039978},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6425999999046326},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6291999816894531},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5956000089645386},{"id":"https://openalex.org/C166052673","wikidata":"https://www.wikidata.org/wiki/Q83021","display_name":"Empirical evidence","level":2,"score":0.46219998598098755},{"id":"https://openalex.org/C2781466463","wikidata":"https://www.wikidata.org/wiki/Q621695","display_name":"Blame","level":2,"score":0.4345000088214874},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.41600000858306885},{"id":"https://openalex.org/C2775922551","wikidata":"https://www.wikidata.org/wiki/Q7135033","display_name":"Parallels","level":2,"score":0.3817000091075897},{"id":"https://openalex.org/C98184364","wikidata":"https://www.wikidata.org/wiki/Q1780131","display_name":"Argument (complex analysis)","level":2,"score":0.3725999891757965},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.3634999990463257},{"id":"https://openalex.org/C71889745","wikidata":"https://www.wikidata.org/wiki/Q1783264","display_name":"Counterfactual conditional","level":3,"score":0.33250001072883606},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33169999718666077},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.328900009393692},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3278000056743622},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.3176000118255615},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.31040000915527344},{"id":"https://openalex.org/C141330323","wikidata":"https://www.wikidata.org/wiki/Q2354820","display_name":"Evidence-based practice","level":3,"score":0.3059000074863434},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.28769999742507935},{"id":"https://openalex.org/C80114427","wikidata":"https://www.wikidata.org/wiki/Q634260","display_name":"Circumstantial evidence","level":2,"score":0.2840000092983246},{"id":"https://openalex.org/C2779010991","wikidata":"https://www.wikidata.org/wiki/Q2720909","display_name":"Artifact (error)","level":2,"score":0.28279998898506165},{"id":"https://openalex.org/C11671645","wikidata":"https://www.wikidata.org/wiki/Q5054567","display_name":"Causal model","level":2,"score":0.27799999713897705},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2660999894142151},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.265500009059906},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.25940001010894775},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.2556000053882599},{"id":"https://openalex.org/C195094911","wikidata":"https://www.wikidata.org/wiki/Q14167904","display_name":"Process management","level":1,"score":0.25290000438690186},{"id":"https://openalex.org/C2777877512","wikidata":"https://www.wikidata.org/wiki/Q1116097","display_name":"Common ground","level":2,"score":0.25209999084472656},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.25049999356269836}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.09537","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.09537","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.09537","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.09537","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7725281119346619,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Evidence-grounded":[0],"reasoning":[1],"requires":[2],"more":[3],"than":[4],"attaching":[5],"retrieved":[6],"text":[7],"to":[8,41,180],"a":[9,11,57,62,65,72,91,124,188],"prediction:":[10],"model":[12,63,197],"should":[13],"make":[14],"decisions":[15],"that":[16,85,95,187,204],"depend":[17],"on":[18,127],"whether":[19,78],"the":[20,24,42,79,82,118,128,184,200,206],"provided":[21],"evidence":[22,36,49,55,80,114,150,157,164,192],"supports":[23,81],"target":[25],"claim.":[26],"In":[27],"practice,":[28],"this":[29],"often":[30],"fails":[31],"because":[32],"supervision":[33,92,203],"is":[34,37,90,151,194],"weak,":[35],"only":[38,196],"loosely":[39],"tied":[40],"claim,":[43,74],"and":[44,71,75,109,122,139,147,166,177],"evaluation":[45],"does":[46],"not":[47,195],"test":[48],"dependence":[50],"directly.":[51],"We":[52,116],"introduce":[53],"case-grounded":[54],"verification,":[56],"general":[58],"framework":[59,119],"in":[60,120,191],"which":[61],"receives":[64],"local":[66],"case":[67,169],"context,":[68],"external":[69,168],"evidence,":[70,146],"structured":[73],"must":[76],"decide":[77],"claim":[83],"for":[84],"case.":[86],"Our":[87],"key":[88],"contribution":[89],"construction":[93],"procedure":[94],"generates":[96],"explicit":[97],"support":[98,130],"examples":[99],"together":[100],"with":[101],"semantically":[102],"controlled":[103],"non-support":[104],"examples,":[105],"including":[106],"counterfactual":[107],"wrong-state":[108],"topic-related":[110],"negatives,":[111],"without":[112],"manual":[113],"annotation.":[115],"instantiate":[117],"radiology":[121],"train":[123],"standard":[125],"verifier":[126,134],"resulting":[129],"task.":[131],"The":[132],"learned":[133],"substantially":[135],"outperforms":[136],"both":[137],"case-only":[138],"evidence-only":[140],"baselines,":[141],"remains":[142,178],"strong":[143],"under":[144,174],"correct":[145],"collapses":[148],"when":[149],"removed":[152],"or":[153],"swapped,":[154],"indicating":[155],"genuine":[156],"dependence.":[158],"This":[159],"behavior":[160],"transfers":[161],"across":[162],"unseen":[163],"articles":[165],"an":[167],"distribution,":[170],"though":[171],"performance":[172],"degrades":[173],"evidence-source":[175],"shift":[176],"sensitive":[179],"backbone":[181],"choice.":[182],"Overall,":[183],"results":[185],"suggest":[186],"major":[189],"bottleneck":[190],"grounding":[193],"capacity,":[198],"but":[199],"lack":[201],"of":[202,209],"encodes":[205],"causal":[207],"role":[208],"evidence.":[210]},"counts_by_year":[],"updated_date":"2026-05-04T08:30:34.212998","created_date":"2026-04-14T00:00:00"}
