{"id":"https://openalex.org/W7150730839","doi":"https://doi.org/10.48550/arxiv.2604.02733","title":"DeltaLogic: Minimal Premise Edits Reveal Belief-Revision Failures in Logical Reasoning Models","display_name":"DeltaLogic: Minimal Premise Edits Reveal Belief-Revision Failures in Logical Reasoning Models","publication_year":2026,"publication_date":"2026-04-03","ids":{"openalex":"https://openalex.org/W7150730839","doi":"https://doi.org/10.48550/arxiv.2604.02733"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.02733","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02733","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.02733","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043887050","display_name":"Amit Dhanda","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dhanda, Amit","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5043887050"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.2563999891281128,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.2563999891281128,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2214999943971634,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.11320000141859055,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/premise","display_name":"Premise","score":0.8449000120162964},{"id":"https://openalex.org/keywords/belief-revision","display_name":"Belief revision","score":0.5777000188827515},{"id":"https://openalex.org/keywords/automated-reasoning","display_name":"Automated reasoning","score":0.5472999811172485},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5188000202178955},{"id":"https://openalex.org/keywords/logical-consequence","display_name":"Logical consequence","score":0.4465999901294708},{"id":"https://openalex.org/keywords/non-monotonic-logic","display_name":"Non-monotonic logic","score":0.41620001196861267},{"id":"https://openalex.org/keywords/model-based-reasoning","display_name":"Model-based reasoning","score":0.4083999991416931},{"id":"https://openalex.org/keywords/abductive-reasoning","display_name":"Abductive reasoning","score":0.4043999910354614}],"concepts":[{"id":"https://openalex.org/C2778023277","wikidata":"https://www.wikidata.org/wiki/Q321703","display_name":"Premise","level":2,"score":0.8449000120162964},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6068000197410583},{"id":"https://openalex.org/C128913409","wikidata":"https://www.wikidata.org/wiki/Q3566063","display_name":"Belief revision","level":2,"score":0.5777000188827515},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.5472999811172485},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5336999893188477},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5188000202178955},{"id":"https://openalex.org/C134752490","wikidata":"https://www.wikidata.org/wiki/Q374182","display_name":"Logical consequence","level":2,"score":0.4465999901294708},{"id":"https://openalex.org/C159032336","wikidata":"https://www.wikidata.org/wiki/Q2488768","display_name":"Non-monotonic logic","level":2,"score":0.41620001196861267},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.4083999991416931},{"id":"https://openalex.org/C166088908","wikidata":"https://www.wikidata.org/wiki/Q308495","display_name":"Abductive reasoning","level":2,"score":0.4043999910354614},{"id":"https://openalex.org/C86827895","wikidata":"https://www.wikidata.org/wiki/Q7098582","display_name":"Opportunistic reasoning","level":4,"score":0.4016999900341034},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.3939000070095062},{"id":"https://openalex.org/C97364631","wikidata":"https://www.wikidata.org/wiki/Q484284","display_name":"Deductive reasoning","level":2,"score":0.38600000739097595},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.36800000071525574},{"id":"https://openalex.org/C73301696","wikidata":"https://www.wikidata.org/wiki/Q5469984","display_name":"Formalism (music)","level":3,"score":0.36059999465942383},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.34940001368522644},{"id":"https://openalex.org/C43971567","wikidata":"https://www.wikidata.org/wiki/Q3142865","display_name":"Logical reasoning","level":2,"score":0.34310001134872437},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3221000134944916},{"id":"https://openalex.org/C20162079","wikidata":"https://www.wikidata.org/wiki/Q1151406","display_name":"Case-based reasoning","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C2778790839","wikidata":"https://www.wikidata.org/wiki/Q6667497","display_name":"Logical form","level":2,"score":0.2563000023365021},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.25619998574256897},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.25369998812675476}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.02733","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02733","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.02733","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02733","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.415053129196167,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Reasoning":[0],"benchmarks":[1],"typically":[2],"evaluate":[3,88],"whether":[4,70],"a":[5,12,19,37,63,98,197],"model":[6],"derives":[7],"the":[8,71,132,147],"correct":[9],"answer":[10],"from":[11,83],"fixed":[13,182],"premise":[14],"set,":[15],"but":[16,119,167],"they":[17],"under-measure":[18],"closely":[20],"related":[21],"capability":[22,203],"that":[23,41,178,204],"matters":[24],"in":[25],"dynamic":[26],"environments:":[27],"belief":[28,188],"revision":[29,48,112,122,189],"under":[30,58,181],"minimal":[31,64],"evidence":[32,192],"change.":[33],"We":[34,80],"introduce":[35],"DeltaLogic,":[36],"benchmark":[38],"transformation":[39],"protocol":[40],"converts":[42],"natural-language":[43],"reasoning":[44,106,202],"examples":[45],"into":[46,140],"short":[47],"episodes.":[49],"Each":[50],"episode":[51],"first":[52],"asks":[53,69],"for":[54],"an":[55],"initial":[56,105,117],"conclusion":[57,73],"premises":[59,183],"P,":[60],"then":[61],"applies":[62],"edit":[65],"\u03b4(P),":[66],"and":[67,85,87,172,199,209],"finally":[68],"previous":[72],"should":[74,135],"remain":[75],"stable":[76],"or":[77],"be":[78],"revised.":[79],"instantiate":[81],"DeltaLogic":[82,194],"FOLIO":[84],"ProofWriter":[86],"small":[89],"causal":[90],"language":[91],"models":[92],"with":[93,124],"constrained":[94],"label":[95,134],"scoring.":[96],"On":[97],"completed":[99],"30-episode":[100],"Qwen":[101],"evaluation":[102],"subset,":[103],"stronger":[104,111,162],"still":[107,168],"does":[108,184],"not":[109,185],"imply":[110,186],"behavior:":[113],"Qwen3-1.7B":[114],"reaches":[115],"0.667":[116],"accuracy":[118],"only":[120],"0.467":[121],"accuracy,":[123],"inertia":[125],"rising":[126],"to":[127],"0.600":[128,156],"on":[129],"episodes":[130],"where":[131],"gold":[133],"change,":[136],"while":[137],"Qwen3-0.6B":[138],"collapses":[139],"near":[141],"universal":[142],"abstention.":[143],"There,":[144],"Qwen3-4B":[145],"preserves":[146],"same":[148],"inertial":[149],"failure":[150],"pattern":[151],"(0.650":[152],"initial,":[153,164],"0.450":[154],"revised,":[155],"inertia),":[157],"whereas":[158],"Phi-4-mini-instruct":[159],"is":[160],"substantially":[161],"(0.950":[163],"0.850":[165],"revised)":[166],"exhibits":[169],"non-trivial":[170],"abstention":[171],"control":[173],"instability.":[174],"These":[175],"results":[176],"suggest":[177],"logical":[179,207],"competence":[180],"disciplined":[187],"after":[190],"local":[191],"edits.":[193],"therefore":[195],"targets":[196],"distinct":[198],"practically":[200],"important":[201],"complements":[205],"existing":[206],"inference":[208],"belief-updating":[210],"benchmarks.":[211]},"counts_by_year":[],"updated_date":"2026-04-07T06:06:30.997549","created_date":"2026-04-07T00:00:00"}
