{"id":"https://openalex.org/W7154632117","doi":"https://doi.org/10.48550/arxiv.2604.13371","title":"Empirical Evidence of Complexity-Induced Limits in Large Language Models on Finite Discrete State-Space Problems with Explicit Validity Constraints","display_name":"Empirical Evidence of Complexity-Induced Limits in Large Language Models on Finite Discrete State-Space Problems with Explicit Validity Constraints","publication_year":2026,"publication_date":"2026-04-15","ids":{"openalex":"https://openalex.org/W7154632117","doi":"https://doi.org/10.48550/arxiv.2604.13371"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.13371","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13371","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.13371","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5117481317","display_name":"Md. Fahad Ullah Utsho","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Utsho, Md. Fahad Ullah","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133776883","display_name":"Mohd. Ruhul Ameen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ameen, Mohd. Ruhul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063245603","display_name":"Akif Islam","orcid":"https://orcid.org/0009-0004-2755-7316"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Islam, Akif","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133772046","display_name":"Md. Golam Rashed","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rashed, Md. Golam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133732717","display_name":"Dipankar Das","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Das, Dipankar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5117481317"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.17579999566078186,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.17579999566078186,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.1371999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.11420000344514847,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parameterized-complexity","display_name":"Parameterized complexity","score":0.6154000163078308},{"id":"https://openalex.org/keywords/automated-reasoning","display_name":"Automated reasoning","score":0.45719999074935913},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.44530001282691956},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.40220001339912415},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.38339999318122864},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.38199999928474426},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.3799000084400177},{"id":"https://openalex.org/keywords/commonsense-reasoning","display_name":"Commonsense reasoning","score":0.34540000557899475},{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.336899995803833}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6410999894142151},{"id":"https://openalex.org/C165464430","wikidata":"https://www.wikidata.org/wiki/Q1570441","display_name":"Parameterized complexity","level":2,"score":0.6154000163078308},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.5450999736785889},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.45719999074935913},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.44530001282691956},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.40220001339912415},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.38339999318122864},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.38199999928474426},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.3799000084400177},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3635999858379364},{"id":"https://openalex.org/C193221554","wikidata":"https://www.wikidata.org/wiki/Q5153664","display_name":"Commonsense reasoning","level":2,"score":0.34540000557899475},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.336899995803833},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.33500000834465027},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.3183000087738037},{"id":"https://openalex.org/C159032336","wikidata":"https://www.wikidata.org/wiki/Q2488768","display_name":"Non-monotonic logic","level":2,"score":0.29919999837875366},{"id":"https://openalex.org/C71889745","wikidata":"https://www.wikidata.org/wiki/Q1783264","display_name":"Counterfactual conditional","level":3,"score":0.29660001397132874},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.29660001397132874},{"id":"https://openalex.org/C44616089","wikidata":"https://www.wikidata.org/wiki/Q30158686","display_name":"Constraint satisfaction","level":3,"score":0.295199990272522},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.2892000079154968},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2793999910354614},{"id":"https://openalex.org/C83725634","wikidata":"https://www.wikidata.org/wiki/Q7268699","display_name":"Qualitative reasoning","level":2,"score":0.2727999985218048},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.272599995136261},{"id":"https://openalex.org/C199622910","wikidata":"https://www.wikidata.org/wiki/Q1128326","display_name":"Constraint satisfaction problem","level":3,"score":0.272599995136261},{"id":"https://openalex.org/C110251889","wikidata":"https://www.wikidata.org/wiki/Q1569697","display_name":"Model checking","level":2,"score":0.2718000113964081},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.2581999897956848}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.13371","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13371","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.13371","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13371","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0,59],"Language":[1],"Models":[2,61],"(LLMs)":[3],"are":[4,128],"increasingly":[5],"described":[6],"as":[7,38,158],"possessing":[8],"strong":[9],"reasoning":[10,35,57,75,159,174,187,221],"capabilities,":[11],"supported":[12],"by":[13,172],"high":[14,119,141],"performance":[15],"on":[16,27],"mathematical,":[17],"logical,":[18],"and":[19,92,112,118,182,194,218],"planning":[20],"benchmarks.":[21],"However,":[22],"most":[23],"existing":[24],"evaluations":[25],"rely":[26],"aggregate":[28],"accuracy":[29,142,166],"over":[30],"fixed":[31],"datasets,":[32],"obscuring":[33],"how":[34],"behavior":[36],"evolves":[37],"task":[39,150],"complexity":[40,100,120,145,152],"increases.":[41],"In":[42],"this":[43,156],"work,":[44],"we":[45,108,163],"introduce":[46],"a":[47,70,133],"controlled":[48,224],"benchmarking":[49],"framework":[50],"to":[51,97,203],"systematically":[52],"evaluate":[53,109],"the":[54,208],"robustness":[55,222],"of":[56,72,85,179],"in":[58,196],"Reasoning":[60],"(LRMs)":[62],"under":[63,223],"progressively":[64],"increasing":[65],"problem":[66,198],"complexity.":[67,225],"We":[68,154],"construct":[69],"suite":[71],"nine":[73],"classical":[74],"tasks:":[76],"Boolean":[77],"Satisfiability,":[78],"Cryptarithmetic,":[79],"Graph":[80],"Coloring,":[81],"River":[82],"Crossing,":[83],"Tower":[84],"Hanoi,":[86],"Water":[87],"Jug,":[88],"Checker":[89],"Jumping,":[90],"Sudoku,":[91],"Rubik's":[93],"Cube,":[94],"each":[95],"parameterized":[96],"precisely":[98],"control":[99],"while":[101],"preserving":[102],"underlying":[103],"semantics.":[104],"Using":[105],"deterministic":[106],"validators,":[107],"multiple":[110],"open":[111],"proprietary":[113],"LRMs":[114],"across":[115],"low,":[116],"intermediate,":[117],"regimes,":[121],"ensuring":[122],"that":[123,213],"only":[124],"fully":[125],"valid":[126],"solutions":[127],"accepted.":[129],"Our":[130],"results":[131],"reveal":[132],"consistent":[134],"phase":[135],"transition":[136],"like":[137],"behavior:":[138],"models":[139],"achieve":[140],"at":[143],"low":[144],"but":[146],"degrade":[147],"sharply":[148],"beyond":[149,215],"specific":[151],"thresholds.":[153],"formalize":[155],"phenomenon":[157],"collapse.":[160],"Across":[161],"tasks,":[162],"observe":[164],"substantial":[165],"declines,":[167],"often":[168],"exceeding":[169],"50%,":[170],"accompanied":[171],"inconsistent":[173],"traces,":[175],"constraint":[176],"violations,":[177],"loss":[178],"state":[180],"tracking,":[181],"confidently":[183],"incorrect":[184],"outputs.":[185],"Increased":[186],"length":[188],"does":[189],"not":[190,201],"reliably":[191],"improve":[192],"correctness,":[193],"gains":[195],"one":[197],"family":[199],"do":[200],"generalize":[202],"others.":[204],"These":[205],"findings":[206],"highlight":[207],"need":[209],"for":[210],"evaluation":[211],"methodologies":[212],"move":[214],"static":[216],"benchmarks":[217],"explicitly":[219],"measure":[220]},"counts_by_year":[],"updated_date":"2026-05-03T08:25:01.440150","created_date":"2026-04-17T00:00:00"}
