{"id":"https://openalex.org/W7151759246","doi":"https://doi.org/10.48550/arxiv.2604.05407","title":"CODESTRUCT: Code Agents over Structured Action Spaces","display_name":"CODESTRUCT: Code Agents over Structured Action Spaces","publication_year":2026,"publication_date":"2026-04-07","ids":{"openalex":"https://openalex.org/W7151759246","doi":"https://doi.org/10.48550/arxiv.2604.05407"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.05407","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05407","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.05407","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133148216","display_name":"Myeongsoo Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kim, Myeongsoo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133217995","display_name":"Joe Hsu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hsu, Joe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056754361","display_name":"Dingmin Wang","orcid":"https://orcid.org/0000-0001-9196-2624"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Dingmin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128446545","display_name":"Shweta Garg","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Garg, Shweta","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133180856","display_name":"Varun Kumar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kumar, Varun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133180015","display_name":"Murali Krishna Ramanathan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramanathan, Murali Krishna","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5133148216"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.5462999939918518,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.5462999939918518,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.11869999766349792,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.04800000041723251,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/codebase","display_name":"Codebase","score":0.5306000113487244},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5151000022888184},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.4684000015258789},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.44020000100135803},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4027000069618225},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4000999927520752},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.37869998812675476},{"id":"https://openalex.org/keywords/disk-formatting","display_name":"Disk formatting","score":0.34860000014305115},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.3391000032424927}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8116000294685364},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.5491999983787537},{"id":"https://openalex.org/C51929080","wikidata":"https://www.wikidata.org/wiki/Q2425187","display_name":"Codebase","level":3,"score":0.5306000113487244},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5151000022888184},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.4684000015258789},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.44020000100135803},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4027000069618225},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4000999927520752},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.37869998812675476},{"id":"https://openalex.org/C88006597","wikidata":"https://www.wikidata.org/wiki/Q690117","display_name":"Disk formatting","level":2,"score":0.34860000014305115},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.3391000032424927},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3077000081539154},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.29980000853538513},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.29440000653266907},{"id":"https://openalex.org/C2778531742","wikidata":"https://www.wikidata.org/wiki/Q17009281","display_name":"Discoverability","level":2,"score":0.29260000586509705},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2881999909877777},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28459998965263367},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.27959999442100525},{"id":"https://openalex.org/C68859911","wikidata":"https://www.wikidata.org/wiki/Q1503724","display_name":"Pattern matching","level":2,"score":0.2784000039100647},{"id":"https://openalex.org/C167254554","wikidata":"https://www.wikidata.org/wiki/Q338451","display_name":"Escrow","level":2,"score":0.2768999934196472},{"id":"https://openalex.org/C193702766","wikidata":"https://www.wikidata.org/wiki/Q1414548","display_name":"Concurrency","level":2,"score":0.275299996137619},{"id":"https://openalex.org/C150292731","wikidata":"https://www.wikidata.org/wiki/Q1342704","display_name":"Code review","level":5,"score":0.27219998836517334},{"id":"https://openalex.org/C175291020","wikidata":"https://www.wikidata.org/wiki/Q1156822","display_name":"Offset (computer science)","level":2,"score":0.26910001039505005},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.2669000029563904},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.2653999924659729},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2637999951839447},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2630999982357025},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.2623000144958496},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.2612999975681305},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.2538999915122986},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2533999979496002},{"id":"https://openalex.org/C75701414","wikidata":"https://www.wikidata.org/wiki/Q1651672","display_name":"Boilerplate text","level":2,"score":0.2524999976158142},{"id":"https://openalex.org/C187029079","wikidata":"https://www.wikidata.org/wiki/Q958679","display_name":"Cognitive reframing","level":2,"score":0.25130000710487366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.05407","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05407","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.05407","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05407","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"LLM-based":[0],"code":[1,138],"agents":[2,35],"treat":[3],"repositories":[4],"as":[5,29,104],"unstructured":[6],"text,":[7],"applying":[8,58],"edits":[9],"through":[10],"brittle":[11],"string":[12],"matching":[13],"that":[14,88,129],"frequently":[15,89],"fails":[16],"due":[17],"to":[18,61,91,110,124],"formatting":[19],"drift":[20],"or":[21],"ambiguous":[22],"patterns.":[23],"We":[24],"propose":[25],"reframing":[26],"the":[27],"codebase":[28],"a":[30,133],"structured":[31],"action":[32],"space":[33],"where":[34],"operate":[36],"on":[37,66],"named":[38],"AST":[39],"entities":[40],"rather":[41],"than":[42],"text":[43],"spans.":[44],"Our":[45,126],"framework,":[46],"CODESTRUCT,":[47],"provides":[48],"readCode":[49],"for":[50,57,84,137],"retrieving":[51],"complete":[52],"syntactic":[53],"units":[54],"and":[55],"editCode":[56],"syntax-validated":[59],"transformations":[60],"semantic":[62],"program":[63],"elements.":[64],"Evaluated":[65],"SWE-Bench":[67],"Verified":[68],"across":[69],"six":[70],"LLMs,":[71],"CODESTRUCT":[72],"improves":[73,101],"Pass@1":[74],"accuracy":[75,117],"by":[76,82,102],"1.2-5.0%":[77],"while":[78],"reducing":[79],"token":[80],"consumption":[81],"12-38%":[83],"most":[85],"models.":[86],"Models":[87],"fail":[90],"produce":[92],"valid":[93],"patches":[94],"under":[95],"text-based":[96],"interfaces":[97,131],"benefit":[98],"most:":[99],"GPT-5-nano":[100],"20.8%":[103],"empty-patch":[105],"failures":[106],"drop":[107],"from":[108],"46.6%":[109],"7.2%.":[111],"On":[112],"CodeAssistBench,":[113],"we":[114],"observe":[115],"consistent":[116],"gains":[118],"(+0.8-4.4%)":[119],"with":[120],"cost":[121],"reductions":[122],"up":[123],"33%.":[125],"results":[127],"show":[128],"structure-aware":[130],"offer":[132],"more":[134],"reliable":[135],"foundation":[136],"agents.":[139]},"counts_by_year":[],"updated_date":"2026-04-09T06:13:59.934233","created_date":"2026-04-09T00:00:00"}
