{"id":"https://openalex.org/W7160608640","doi":"https://doi.org/10.48550/arxiv.2605.06445","title":"Constraint Decay: The Fragility of LLM Agents in Backend Code Generation","display_name":"Constraint Decay: The Fragility of LLM Agents in Backend Code Generation","publication_year":2026,"publication_date":"2026-05-07","ids":{"openalex":"https://openalex.org/W7160608640","doi":"https://doi.org/10.48550/arxiv.2605.06445"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.06445","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06445","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.06445","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120721042","display_name":"Francesco Dente","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dente, Francesco","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135670242","display_name":"Dario Satriani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Satriani, Dario","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5011336242","display_name":"Paolo Papotti","orcid":"https://orcid.org/0000-0003-0651-4128"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Papotti, Paolo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.44130000472068787,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.44130000472068787,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.07090000063180923,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11450","display_name":"Model-Driven Software Engineering Techniques","score":0.04479999840259552,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fragility","display_name":"Fragility","score":0.5810999870300293},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.5213000178337097},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5098999738693237},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.47609999775886536},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.43849998712539673},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.41119998693466187},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.38749998807907104},{"id":"https://openalex.org/keywords/code-generation","display_name":"Code generation","score":0.33219999074935913}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7738000154495239},{"id":"https://openalex.org/C80191262","wikidata":"https://www.wikidata.org/wiki/Q5477668","display_name":"Fragility","level":2,"score":0.5810999870300293},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.5213000178337097},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5098999738693237},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.47609999775886536},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.43849998712539673},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.41119998693466187},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.41119998693466187},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.38749998807907104},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.36230000853538513},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.33219999074935913},{"id":"https://openalex.org/C40422974","wikidata":"https://www.wikidata.org/wiki/Q741248","display_name":"Assertion","level":2,"score":0.33000001311302185},{"id":"https://openalex.org/C199519371","wikidata":"https://www.wikidata.org/wiki/Q942695","display_name":"Source lines of code","level":3,"score":0.33000001311302185},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.3244999945163727},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.32330000400543213},{"id":"https://openalex.org/C44616089","wikidata":"https://www.wikidata.org/wiki/Q30158686","display_name":"Constraint satisfaction","level":3,"score":0.31290000677108765},{"id":"https://openalex.org/C145644426","wikidata":"https://www.wikidata.org/wiki/Q169411","display_name":"Unified Modeling Language","level":3,"score":0.30720001459121704},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.30160000920295715},{"id":"https://openalex.org/C21200559","wikidata":"https://www.wikidata.org/wiki/Q7451068","display_name":"Sensitivity (control systems)","level":2,"score":0.2985000014305115},{"id":"https://openalex.org/C2779639559","wikidata":"https://www.wikidata.org/wiki/Q7661178","display_name":"Symbolic execution","level":3,"score":0.2799000144004822},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.2786000072956085},{"id":"https://openalex.org/C133264317","wikidata":"https://www.wikidata.org/wiki/Q1397689","display_name":"Object Constraint Language","level":5,"score":0.27549999952316284},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.2709999978542328},{"id":"https://openalex.org/C128942645","wikidata":"https://www.wikidata.org/wiki/Q1568346","display_name":"Test case","level":3,"score":0.2651999890804291},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.25699999928474426},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.25290000438690186}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.06445","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06445","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.06445","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06445","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.43200573325157166,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Model":[2],"(LLM)":[3],"agents":[4,54,147],"demonstrate":[5],"strong":[6],"performance":[7,112,145],"in":[8,58,124,149,161],"autonomous":[9],"code":[10],"generation":[11,71],"under":[12],"loose":[13],"specifications.":[14],"However,":[15],"production-grade":[16],"software":[17],"requires":[18],"strict":[19],"adherence":[20],"to":[21,130],"structural":[22,56,86,108,194],"constraints,":[23],"such":[24],"as":[25,107,181],"architectural":[26],"patterns,":[27],"databases,":[28],"and":[29,73,96,177,193],"object-relational":[30],"mappings.":[31],"Existing":[32],"benchmarks":[33],"often":[34],"overlook":[35],"these":[36],"non-functional":[37],"requirements,":[38],"rewarding":[39],"functionally":[40],"correct":[41],"but":[42,155],"structurally":[43],"arbitrary":[44],"solutions.":[45],"We":[46],"present":[47],"a":[48,64,89,102,114,197],"systematic":[49],"study":[50],"evaluating":[51],"how":[52],"well":[53],"handle":[55],"constraints":[57],"multi-file":[59],"backend":[60],"generation.":[61],"By":[62],"fixing":[63],"unified":[65],"API":[66],"contract":[67],"across":[68],"80":[69],"greenfield":[70],"tasks":[72,76],"20":[74],"feature-implementation":[75],"spanning":[77],"eight":[78],"web":[79],"frameworks,":[80],"we":[81],"isolate":[82],"the":[83,182],"effect":[84],"of":[85,104],"complexity":[87],"using":[88],"dual":[90],"evaluation":[91],"with":[92],"end-to-end":[93],"behavioral":[94],"tests":[95],"static":[97],"verifiers.":[98],"Our":[99],"findings":[100],"reveal":[101],"phenomenon":[103],"constraint":[105],"decay:":[106],"requirements":[109,195],"accumulate,":[110],"agent":[111],"exhibits":[113],"substantial":[115],"decline.":[116],"Capable":[117],"configurations":[118,137],"lose":[119],"30":[120],"points":[121],"on":[122,159],"average":[123,160],"assertion":[125],"pass":[126],"rates":[127],"from":[128],"baseline":[129],"fully":[131],"specified":[132],"tasks,":[133],"while":[134],"some":[135],"weaker":[136],"approach":[138],"zero.":[139],"Framework":[140],"sensitivity":[141],"analysis":[142,169],"exposes":[143],"significant":[144],"disparities:":[146],"succeed":[148],"minimal,":[150],"explicit":[151],"frameworks":[152],"(e.g.,":[153,164,173],"Flask)":[154],"perform":[156],"substantially":[157],"worse":[158],"convention-heavy":[162],"environments":[163],"FastAPI,":[165],"Django).":[166],"Finally,":[167],"error":[168],"identifies":[170],"data-layer":[171],"defects":[172],"incorrect":[174],"query":[175],"composition":[176],"ORM":[178],"runtime":[179],"violations)":[180],"leading":[183],"root":[184],"causes.":[185],"This":[186],"work":[187],"highlights":[188],"that":[189],"jointly":[190],"satisfying":[191],"functional":[192],"remains":[196],"key":[198],"open":[199],"challenge":[200],"for":[201],"coding":[202],"agents.":[203]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-09T00:00:00"}
