{"id":"https://openalex.org/W7147557363","doi":"https://doi.org/10.48550/arxiv.2603.29025","title":"The Model Says Walk: How Surface Heuristics Override Implicit Constraints in LLM Reasoning","display_name":"The Model Says Walk: How Surface Heuristics Override Implicit Constraints in LLM Reasoning","publication_year":2026,"publication_date":"2026-03-30","ids":{"openalex":"https://openalex.org/W7147557363","doi":"https://doi.org/10.48550/arxiv.2603.29025"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.29025","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.29025","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.29025","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132664641","display_name":"Yubo Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Yubo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132655392","display_name":"Lu Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Lu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070703219","display_name":"Tianchong Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Tianchong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132568829","display_name":"Ramayya Krishnan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Krishnan, Ramayya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5046671743","display_name":"Rema Padman","orcid":"https://orcid.org/0000-0003-4250-4357"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Padman, Rema","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5132664641"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2766999900341034,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2766999900341034,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1615999937057495,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.15360000729560852,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.7279999852180481},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.7267000079154968},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.6873000264167786},{"id":"https://openalex.org/keywords/generality","display_name":"Generality","score":0.6766999959945679},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6279000043869019},{"id":"https://openalex.org/keywords/forcing","display_name":"Forcing (mathematics)","score":0.5138000249862671},{"id":"https://openalex.org/keywords/sigmoid-function","display_name":"Sigmoid function","score":0.4781999886035919},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.4546000063419342},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4172999858856201}],"concepts":[{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.7279999852180481},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.7267000079154968},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.6873000264167786},{"id":"https://openalex.org/C2780767217","wikidata":"https://www.wikidata.org/wiki/Q5532421","display_name":"Generality","level":2,"score":0.6766999959945679},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6279000043869019},{"id":"https://openalex.org/C197115733","wikidata":"https://www.wikidata.org/wiki/Q1003136","display_name":"Forcing (mathematics)","level":2,"score":0.5138000249862671},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49729999899864197},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.48590001463890076},{"id":"https://openalex.org/C81388566","wikidata":"https://www.wikidata.org/wiki/Q526668","display_name":"Sigmoid function","level":3,"score":0.4781999886035919},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.4546000063419342},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4172999858856201},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.4065999984741211},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3479999899864197},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.3418999910354614},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.32089999318122864},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3019999861717224},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29840001463890076},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2955000102519989},{"id":"https://openalex.org/C2776493592","wikidata":"https://www.wikidata.org/wiki/Q5158717","display_name":"Succinctness","level":2,"score":0.288100004196167},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.27889999747276306},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.27399998903274536},{"id":"https://openalex.org/C44616089","wikidata":"https://www.wikidata.org/wiki/Q30158686","display_name":"Constraint satisfaction","level":3,"score":0.2734000086784363},{"id":"https://openalex.org/C2776799497","wikidata":"https://www.wikidata.org/wiki/Q484298","display_name":"Surface (topology)","level":2,"score":0.27219998836517334},{"id":"https://openalex.org/C24574437","wikidata":"https://www.wikidata.org/wiki/Q7135228","display_name":"Parametric model","level":3,"score":0.2703999876976013},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.2671000063419342},{"id":"https://openalex.org/C199622910","wikidata":"https://www.wikidata.org/wiki/Q1128326","display_name":"Constraint satisfaction problem","level":3,"score":0.25999999046325684},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.25929999351501465}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.29025","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.29025","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.29025","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.29025","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2,32,131,169],"systematically":[3],"fail":[4],"when":[5,134],"a":[6,20,182,188],"salient":[7],"surface":[8],"cue":[9,40],"conflicts":[10],"with":[11,58,79],"an":[12],"unstated":[13],"feasibility":[14],"constraint.":[15],"We":[16],"study":[17],"this":[18],"through":[19],"diagnose-measure-bridge-treat":[21],"framework.":[22],"Causal-behavioral":[23],"analysis":[24],"of":[25],"the":[26,38,49,111,120,135,150],"``car":[27],"wash":[28],"problem''":[29],"across":[30,88],"six":[31],"reveals":[33],"approximately":[34],"context-independent":[35],"sigmoid":[36,151],"heuristics:":[37],"distance":[39],"exerts":[41],"8.7":[42],"to":[43,140,154,164,170],"38":[44],"times":[45],"more":[46,56],"influence":[47],"than":[48,61,127],"goal,":[50],"and":[51,82,100,157,186],"token-level":[52],"attribution":[53],"shows":[54],"patterns":[55],"consistent":[57],"keyword":[59],"associations":[60],"compositional":[62],"inference.":[63],"The":[64],"Heuristic":[65],"Override":[66],"Benchmark":[67],"(HOB)":[68],"--":[69,85],"500":[70],"instances":[71],"spanning":[72],"4":[73],"heuristic":[74,179],"by":[75,167],"5":[76],"constraint":[77,124,136],"families":[78],"minimal":[80,107],"pairs":[81],"explicitness":[83],"gradients":[84],"demonstrates":[86],"generality":[87],"14":[89],"models:":[90],"under":[91],"strict":[92],"evaluation":[93],"(10/10":[94],"correct),":[95],"no":[96],"model":[97],"exceeds":[98],"75%,":[99],"presence":[101],"constraints":[102],"are":[103],"hardest":[104],"(44%).":[105],"A":[106],"hint":[108],"(e.g.,":[109],"emphasizing":[110],"key":[112],"object)":[113],"recovers":[114,162],"+15":[115],"pp":[116,166],"on":[117],"average,":[118],"suggesting":[119],"failure":[121],"lies":[122],"in":[123],"inference":[125],"rather":[126],"missing":[128],"knowledge;":[129],"12/14":[130],"perform":[132],"worse":[133],"is":[137],"removed":[138],"(up":[139],"-39":[141],"pp),":[142],"revealing":[143],"conservative":[144],"bias.":[145],"Parametric":[146],"probes":[147],"confirm":[148],"that":[149],"pattern":[152],"generalizes":[153],"cost,":[155],"efficiency,":[156],"semantic-similarity":[158],"heuristics;":[159],"goal-decomposition":[160],"prompting":[161],"+6":[163],"9":[165],"forcing":[168],"enumerate":[171],"preconditions":[172],"before":[173],"answering.":[174],"Together,":[175],"these":[176],"results":[177],"characterize":[178],"override":[180],"as":[181],"systematic":[183],"reasoning":[184],"vulnerability":[185],"provide":[187],"benchmark":[189],"for":[190],"measuring":[191],"progress":[192],"toward":[193],"resolving":[194],"it.":[195]},"counts_by_year":[],"updated_date":"2026-05-03T08:25:01.440150","created_date":"2026-04-02T00:00:00"}
